PLEAC = Language Examples Alike Cookbook PLEAC examples are drawn from the "Perl Cookbook" by Tom Christiansen & Nathan Torkington, published by O'Reilly. They provide a nice range of examples oriented toward data munging, the type of work I tend to want to do first when learning a new language.
The Julia examples below are principally translations from the Python version
I'm learning as I go, so the code below probably doesn't represent best practice. Your suggestions are welcome! Please file an issue or make a pull request to the github repo.
The examples are not complete. Missing items are generally noted in comments.
#make a file
contents="""Here are
a few
lines of
text content."""
fo=open("julia_file.txt", "w")
write(fo, contents)
close(fo)
fi=open("julia_file.txt", "r")
for line in readlines(fi)
line = rstrip(line)
size = length(line)
println(size)
end
close(fi)
8 5 8 13
fi=open("julia_file.txt", "r")
for line in readlines(fi)
println(length(rstrip(line)))
end
close(fi)
8 5 8 13
al=readlines(open("julia_file.txt", "r"))
4-element Array{Any,1}: "Here are\n" "a few\n" "lines of\n" "text content."
t=readall(open("julia_file.txt", "r"))
"Here are\na few\nlines of\ntext content."
t
"Here are\na few\nlines of\ntext content."
w=readdlm(open("julia_file.txt", "r"), ' ')[1] #first word
"Here"
fi=open("julia_file.txt2", "w")
writedlm(fi, ["One","Two","Three"], ' ')
close(fi)
help(seek)
Loading help data... Base.seek(s, pos) Seek a stream to the given position.
fi=open("julia_file.txt", "r")
ba=readbytes(fi, 4096)
ba'
1x37 Array{Uint8,2}: 0x48 0x65 0x72 0x65 0x20 0x61 … 0x6e 0x74 0x65 0x6e 0x74 0x2e
seek(fi,12) #seek to byte 12
println("I'm $(position(fi)) bytes from the start of the file")
I'm 12 bytes from the start of the file
seekstart(fi) #seek to start
seekend(fi) #seek to end
IOStream(<file julia_file.txt>)
seekend(fi)
skip(fi, -2) #relative seek
position(fi)
35
position(fi)
35
# NOT IMPLEMENTED:
# pos = os.lseek(myfile.fileno(),0,1) #?? what does this do?
#not implemented
open("julia_file.txt", "r") do fi
lines= readlines(fi)
end
length(lines)
WARNING:
lines not defined at In[17]:4
t=readall(open("julia_file.txt", "r"))
backtraces on your platform are often misleading or partially incorrect
"Here are\na few\nlines of\ntext content."
para_count = length(split(t, "in"))
2
#simple word count
words=split(t)
8-element Array{String,1}: "Here" "are" "a" "few" "lines" "of" "text" "content."
word_dict=Dict()
for w in words
word_dict[w] = get(word_dict, w, 0)+1
end
word_dict
{"text"=>1,"content."=>1,"are"=>1,"few"=>1,"Here"=>1,"lines"=>1,"of"=>1,"a"=>1}
using TextAnalysis
tokens(Document(t))
8-element Array{UTF8String,1}: "Here" "are" "a" "few" "lines" "of" "text" "content."
words=split(remove_punctuation!(Document(t))) #we could remove numbers too.
8-element Array{String,1}: "Here" "are" "a" "few" "lines" "of" "text" "content"
word_dict=Dict()
for w in words
word_dict[w] = get(word_dict, w, 0)+1
end
word_dict
{"text"=>1,"are"=>1,"few"=>1,"Here"=>1,"lines"=>1,"content"=>1,"of"=>1,"a"=>1}
#line frequency count
lines=readlines(open("julia_file.txt", "r"))
line_dict=Dict()
for w in lines
line_dict[w] = get(line_dict, w, 0)+1
end
line_dict
{"lines of\n"=>1,"Here are\n"=>1,"a few\n"=>1,"text content."=>1}
lines= reverse( readlines(open("julia_file.txt", "r")) )
4-element Array{Any,1}: "text content." "lines of\n" "a few\n" "Here are\n"
fi=open("julia_file.txt", "r")
seekend(fi)
endpos = position(fi)
37
i=1
while i<3 #or while true
sleep(1)
seekend(fi)
if position(fi)>endpos
endpos=position(fi)
println("time: $i. new size: $endpos")
end
i=i+1
end
close(fi)
lines= reverse( readlines(open("julia_file.txt", "r")) )
length(lines)
4
pick = rand(1:length(lines))
lines[pick]
"Here are\n"
using Distributions
shuffle(lines)
4-element Array{Any,1}: "a few\n" "text content." "Here are\n" "lines of\n"
DESIRED_LINE=3
lines[DESIRED_LINE]
"a few\n"
pattern=" "
record = lines[1]
split(record)
2-element Array{String,1}: "text" "content."
#create test file
#make a file
contents="""Here are
a few
lines of
text content."""
fo=open("julia_file.txt", "w")
write(fo, contents)
close(fo)
fi=open("julia_file.txt", "r+")
pos=0
prev_pos=0
for ln in eachline(fi)
prev_pos = pos
pos = position(fi)
end
close(fi)
println(prev_pos)
Warning: could not import Base.foldl into NumericExtensions
24
Warning: could not import Base.foldr into NumericExtensions
cp("julia_file.txt", "julia_file2.txt")
open("julia_file2.txt", "w") do fi
truncate(fi, prev_pos)
end
trunc8 = readall(open("julia_file.txt", "r"))
open("julia_file2.txt", "w") do fo
write(fo, trunc8[1:prev_pos])
end
result = readall(open("julia_file2.txt", "r"))
result
"Here are\na few\nlines of\n"
open("julia_file.txt", "r") do fi
ba=readbytes(fi)
end
ba'
1x37 Array{Uint8,2}: 0x48 0x65 0x72 0x65 0x20 0x61 … 0x6e 0x74 0x65 0x6e 0x74 0x2e
function readstring(stream, numchars)
bytes=readbytes(stream, numchars)
return join([char(v) for v in bytes])
end
readstring (generic function with 1 method)
#make a file : 2 fields of 4 chars (+ \n) = 9 characters per line
contents=""" a b
blah at
line of
text1234"""
open("julia_fixed.dat", "w") do fo
write(fo, contents)
end
35
recsize=8+1 # 8 characters of data + line ending
recno=2
address = recsize * recno
open("julia_fixed.dat", "r") do fi
seek(fi,address)
println(readstring(fi, recsize))
end
line of
open("julia_fixed.dat", "r+") do fi
seek(fi,address)
recstr = readstring(fi, recsize)
newrec = uppercase(recstr)
seek(fi,address)
write(fi,newrec)
end
9
open("julia_fixed.dat", "r") do fi
dt=readall(fi)
print(dt)
end
a b blah at LINE OF text1234
#NOT IMPLEMENTED
Pkg.add("IniFile")
INFO: No packages to install, update or remove. INFO: REQUIRE updated.
# define a packable binary record
using StrPack
@struct type TstStr
int1::Int64
float1::Float64
end
RECORDSIZE=sizeof(TstStr)
16
#write out sample data
rec=TstStr(4455, 556.32)
open("bintest.dat","w") do fo
pack(fo, rec)
pack(fo, TstStr(3455, 556.32))
pack(fo, TstStr(6453, 656.32))
end
WARNING:
max(x) is deprecated, use maximum(x) instead. in depwarn at deprecated.jl:29 in string at ascii.jl:35 WARNING: max(x) is deprecated, use maximum(x) instead. in depwarn at deprecated.jl:29 in string at ascii.jl:35 WARNING: max(x) is deprecated, use maximum(x) instead. in depwarn at deprecated.jl:29 in string at ascii.jl:35
16
open("bintest.dat","r") do fi
seek(fi, RECORDSIZE) # "rewind" to the beginning of the buffer
s2 = unpack(fi, TstStr)
println(s2)
end
WARNING:
TstStr(3455,556.32)
max(x) is deprecated, use maximum(x) instead. in depwarn at deprecated.jl:29 in string at ascii.jl:35
using IniFile
ini = Inifile()
read(ini, "test.ini")
get(ini, "section 1", "strname1") #== "section1name1"
"section1name1"
#Will not implement
#Will not implement