Skip to content
New issue

Have a question about this project? # for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “#”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? # to your account

RFC: Updates to IO, IOString #1424

Merged
merged 3 commits into from
Oct 23, 2012
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
284 changes: 178 additions & 106 deletions base/io.jl
Original file line number Diff line number Diff line change
Expand Up @@ -2,6 +2,182 @@

abstract IO

# Generic IO functions

## byte-order mark, ntoh & hton ##

const ENDIAN_BOM = reinterpret(Uint32,uint8([1:4]))[1]

if ENDIAN_BOM == 0x01020304
ntoh(x) = identity(x)
hton(x) = identity(x)
ltoh(x) = bswap(x)
htol(x) = bswap(x)
elseif ENDIAN_BOM == 0x04030201
ntoh(x) = bswap(x)
hton(x) = bswap(x)
ltoh(x) = identity(x)
htol(x) = identity(x)
else
error("seriously? what is this machine?")
end

## binary I/O ##

# all subtypes should implement this
write(s::IO, x::Uint8) = error(typeof(s)," does not support byte I/O")

if ENDIAN_BOM == 0x01020304
function write(s, x::Integer)
for n = sizeof(x):-1:1
write(s, uint8((x>>>((n-1)<<3))))
end
end
else
function write(s, x::Integer)
for n = 1:sizeof(x)
write(s, uint8((x>>>((n-1)<<3))))
end
end
end

write(s::IO, x::Bool) = write(s, uint8(x))
write(s::IO, x::Float32) = write(s, box(Int32,unbox(Float32,x)))
write(s::IO, x::Float64) = write(s, box(Int64,unbox(Float64,x)))

function write(s::IO, a::AbstractArray)
for i = 1:numel(a)
write(s, a[i])
end
end

function write(s::IO, c::Char)
if c < 0x80
write(s, uint8(c))
return 1
elseif c < 0x800
write(s, uint8(( c >> 6 ) | 0xC0))
write(s, uint8(( c & 0x3F ) | 0x80))
return 2
elseif c < 0x10000
write(s, uint8(( c >> 12 ) | 0xE0))
write(s, uint8(((c >> 6) & 0x3F ) | 0x80))
write(s, uint8(( c & 0x3F ) | 0x80))
return 3
elseif c < 0x110000
write(s, uint8(( c >> 18 ) | 0xF0))
write(s, uint8(((c >> 12) & 0x3F ) | 0x80))
write(s, uint8(((c >> 6) & 0x3F ) | 0x80))
write(s, uint8(( c & 0x3F ) | 0x80))
return 4
end
error("invalid Unicode code point: U+", hex(c))
end

# all subtypes should implement this
read(s::IO, x::Type{Uint8}) = error(typeof(s)," does not support byte I/O")

function read{T <: Integer}(s::IO, ::Type{T})
x = zero(T)
for n = 1:sizeof(x)
x |= (convert(T,read(s,Uint8))<<((n-1)<<3))
end
return x
end

read(s::IO, ::Type{Bool}) = (read(s,Uint8)!=0)
read(s::IO, ::Type{Float32}) = box(Float32,unbox(Int32,read(s,Int32)))
read(s::IO, ::Type{Float64}) = box(Float64,unbox(Int64,read(s,Int64)))

read{T}(s::IO, t::Type{T}, d1::Int, dims::Int...) =
read(s, t, tuple(d1,dims...))
read{T}(s::IO, t::Type{T}, d1::Integer, dims::Integer...) =
read(s, t, map(int,tuple(d1,dims...)))

read{T}(s::IO, ::Type{T}, dims::Dims) = read(s, Array(T, dims))

function read{T}(s::IO, a::Array{T})
for i = 1:numel(a)
a[i] = read(s, T)
end
return a
end

function read(s::IO, ::Type{Char})
ch = read(s, Uint8)
if ch < 0x80
return char(ch)
end

# mimic utf8.next function
trailing = Base._jl_utf8_trailing[ch+1]
c = uint32(0)
for j = 1:trailing
c += ch
c <<= 6
ch = read(s, Uint8)
end
c += ch
c -= Base._jl_utf8_offset[trailing+1]
char(c)
end

function readuntil(s::IO, delim)
out = memio()
while (!eof(s))
c = read(s, Char)
write(out, c)
if c == delim
break
end
end
takebuf_string(out)
end

readline(s::IO) = readuntil(s, '\n')

function readall(s::IO)
out = memio()
while (!eof(s))
c = read(s, Char)
write(out, c)
end
takebuf_string(out)
end

readchomp(x) = chomp(readall(x))

## high-level iterator interfaces ##

type EachLine
stream::IO
end
each_line(stream::IO) = EachLine(stream)

start(itr::EachLine) = readline(itr.stream)
function done(itr::EachLine, line)
if !isempty(line)
return false
end
close(itr.stream)
true
end
next(itr::EachLine, this_line) = (this_line, readline(itr.stream))

function readlines(s, fx::Function...)
a = {}
for l = each_line(s)
for f in fx
l = f(l)
end
push(a, l)
end
return a
end


## IOStream

const sizeof_off_t = int(ccall(:jl_sizeof_off_t, Int32, ()))
const sizeof_ios_t = int(ccall(:jl_sizeof_ios_t, Int32, ()))

Expand Down Expand Up @@ -118,80 +294,6 @@ end
memio(x::Integer) = memio(x, true)
memio() = memio(0, true)

## byte-order mark, ntoh & hton ##

const ENDIAN_BOM = reinterpret(Uint32,uint8([1:4]))[1]

if ENDIAN_BOM == 0x01020304
ntoh(x) = identity(x)
hton(x) = identity(x)
ltoh(x) = bswap(x)
htol(x) = bswap(x)
elseif ENDIAN_BOM == 0x04030201
ntoh(x) = bswap(x)
hton(x) = bswap(x)
ltoh(x) = identity(x)
htol(x) = identity(x)
else
error("seriously? what is this machine?")
end

## binary I/O ##
write(x) = write(OUTPUT_STREAM::IOStream, x)
write(s, x::Uint8) = error(typeof(s)," does not support byte I/O")

if ENDIAN_BOM == 0x01020304
function write(s, x::Integer)
for n = sizeof(x):-1:1
write(s, uint8((x>>>((n-1)<<3))))
end
end
else
function write(s, x::Integer)
for n = 1:sizeof(x)
write(s, uint8((x>>>((n-1)<<3))))
end
end
end

write(s, x::Bool) = write(s, uint8(x))
write(s, x::Float32) = write(s, box(Int32,unbox(Float32,x)))
write(s, x::Float64) = write(s, box(Int64,unbox(Float64,x)))

function write(s, a::AbstractArray)
for i = 1:numel(a)
write(s, a[i])
end
end

read(s, x::Type{Uint8}) = error(typeof(s)," does not support byte I/O")

function read{T <: Integer}(s, ::Type{T})
x = zero(T)
for n = 1:sizeof(x)
x |= (convert(T,read(s,Uint8))<<((n-1)<<3))
end
return x
end

read(s, ::Type{Bool}) = (read(s,Uint8)!=0)
read(s, ::Type{Float32}) = box(Float32,unbox(Int32,read(s,Int32)))
read(s, ::Type{Float64}) = box(Float64,unbox(Int64,read(s,Int64)))

read{T}(s, t::Type{T}, d1::Int, dims::Int...) =
read(s, t, tuple(d1,dims...))
read{T}(s, t::Type{T}, d1::Integer, dims::Integer...) =
read(s, t, map(int,tuple(d1,dims...)))

read{T}(s, ::Type{T}, dims::Dims) = read(s, Array(T, dims))

function read{T}(s, a::Array{T})
for i = 1:numel(a)
a[i] = read(s, T)
end
return a
end

## low-level calls ##

write(s::IOStream, b::Uint8) = ccall(:ios_putc, Int32, (Int32, Ptr{Void}), b, s.ios)
Expand Down Expand Up @@ -294,6 +396,8 @@ function with_output_to_string(thunk)
takebuf_string(m)
end

write(x) = write(OUTPUT_STREAM::IOStream, x)

function readuntil(s::IOStream, delim)
# TODO: faster versions that avoid the encoding check
ccall(:jl_readuntil, ByteString, (Ptr{Void}, Uint8), s.ios, delim)
Expand All @@ -306,38 +410,6 @@ function readall(s::IOStream)
end
readall(filename::String) = open(readall, filename)

readchomp(x) = chomp(readall(x))

readline(s::IOStream) = readuntil(s, '\n')

## high-level iterator interfaces ##

type EachLine
stream::IOStream
end
each_line(stream::IOStream) = EachLine(stream)

start(itr::EachLine) = readline(itr.stream)
function done(itr::EachLine, line)
if !isempty(line)
return false
end
close(itr.stream)
true
end
next(itr::EachLine, this_line) = (this_line, readline(itr.stream))

function readlines(s, fx::Function...)
a = {}
for l = each_line(s)
for f in fx
l = f(l)
end
push(a, l)
end
return a
end

## select interface ##

const sizeof_fd_set = int(ccall(:jl_sizeof_fd_set, Int32, ()))
Expand Down
7 changes: 7 additions & 0 deletions extras/iostring.jl
Original file line number Diff line number Diff line change
Expand Up @@ -36,6 +36,13 @@ read{T}(from::IOString, ::Type{Ptr{T}}) = convert(Ptr{T}, read(from, Uint))

skip(io::IOString, n::Integer) = io.ptr += n
seek(io::IOString, n::Integer) = io.ptr = n+1
seek_end(io::IOString) = io.ptr = length(io.data)+1
position(io::IOString) = io.ptr-1
truncate(io::IOString, n::Integer) = (grow(io.data, n-length(io.data)); ptr = min(ptr, n+1); uint(0))
eof(io::IOString) = io.ptr-1 == length(io.data)
close(io::IOString) = (grow(io.data, 0); ptr = 1; nothing)

bytestring(io::IOString) = bytestring(io.data)

function write{T}(to::IOString, a::Array{T})
if isa(T, BitsKind)
Expand Down