third_party_rust_serde/de.rs
2014-05-19 18:44:20 -07:00

867 lines
25 KiB
Rust

#![feature(macro_rules)]
extern crate collections;
use std::hash::Hash;
use std::num;
use std::result;
use collections::HashMap;
#[deriving(Clone, Eq)]
pub enum Token {
Null,
Bool(bool),
Int(int),
I8(i8),
I16(i16),
I32(i32),
I64(i64),
Uint(uint),
U8(u8),
U16(u16),
U32(u32),
U64(u64),
F32(f32),
F64(f64),
Char(char),
Str(&'static str),
StrBuf(StrBuf),
CollectionStart(uint),
CollectionEnd,
}
macro_rules! decode_primitive {
($( $Variant:pat => $E:expr ),+) => {
match token {
$( $Variant => $E ),+,
_ => Err(self.syntax_error()),
}
}
}
macro_rules! to_result {
($expr:expr, $err:expr) => {
match $expr {
Some(value) => Ok(value),
None => Err($err),
}
}
}
pub trait Deserializer<E>: Iterator<Result<Token, E>> {
fn end_of_stream_error(&self) -> E;
fn syntax_error(&self) -> E;
#[inline]
fn expect_token(&mut self) -> Result<Token, E> {
match self.next() {
Some(Ok(token)) => Ok(token),
Some(Err(err)) => Err(err),
None => Err(self.end_of_stream_error()),
}
}
#[inline]
fn expect_null(&mut self) -> Result<(), E> {
let token = try!(self.expect_token());
self.expect_null_token(token)
}
#[inline]
fn expect_null_token(&mut self, token: Token) -> Result<(), E> {
decode_primitive!(
Null => Ok(()),
CollectionStart(_) => {
self.expect_collection_end()
}
)
}
#[inline]
fn expect_bool(&mut self) -> Result<bool, E> {
let token = try!(self.expect_token());
self.expect_bool_token(token)
}
#[inline]
fn expect_bool_token(&mut self, token: Token) -> Result<bool, E> {
decode_primitive!(Bool(value) => Ok(value))
}
#[inline]
fn expect_num<T: NumCast>(&mut self) -> Result<T, E> {
let token = try!(self.expect_token());
self.expect_num_token(token)
}
#[inline]
fn expect_num_token<T: NumCast>(&mut self, token: Token) -> Result<T, E> {
match token {
Int(x) => to_result!(num::cast(x), self.syntax_error()),
I8(x) => to_result!(num::cast(x), self.syntax_error()),
I16(x) => to_result!(num::cast(x), self.syntax_error()),
I32(x) => to_result!(num::cast(x), self.syntax_error()),
I64(x) => to_result!(num::cast(x), self.syntax_error()),
Uint(x) => to_result!(num::cast(x), self.syntax_error()),
U8(x) => to_result!(num::cast(x), self.syntax_error()),
U16(x) => to_result!(num::cast(x), self.syntax_error()),
U32(x) => to_result!(num::cast(x), self.syntax_error()),
U64(x) => to_result!(num::cast(x), self.syntax_error()),
F32(x) => to_result!(num::cast(x), self.syntax_error()),
F64(x) => to_result!(num::cast(x), self.syntax_error()),
_ => Err(self.syntax_error()),
}
}
#[inline]
fn expect_char(&mut self) -> Result<char, E> {
let token = try!(self.expect_token());
self.expect_char_token(token)
}
#[inline]
fn expect_char_token(&mut self, token: Token) -> Result<char, E> {
decode_primitive!(Char(value) => Ok(value))
}
#[inline]
fn expect_str(&mut self) -> Result<&'static str, E> {
let token = try!(self.expect_token());
self.expect_str_token(token)
}
#[inline]
fn expect_str_token(&mut self, token: Token) -> Result<&'static str, E> {
decode_primitive!(Str(value) => Ok(value))
}
#[inline]
fn expect_strbuf(&mut self) -> Result<StrBuf, E> {
let token = try!(self.expect_token());
self.expect_strbuf_token(token)
}
#[inline]
fn expect_strbuf_token(&mut self, token: Token) -> Result<StrBuf, E> {
decode_primitive!(
Str(value) => Ok(value.to_strbuf()),
StrBuf(value) => Ok(value)
)
}
#[inline]
fn expect_option<
T: Deserializable<E, Self>
>(&mut self) -> Result<Option<T>, E> {
let token = try!(self.expect_token());
self.expect_option_token(token)
}
#[inline]
fn expect_option_token<
T: Deserializable<E, Self>
>(&mut self, token: Token) -> Result<Option<T>, E> {
match token {
Null => Ok(None),
token => {
let value: T = try!(Deserializable::deserialize_token(self, token));
Ok(Some(value))
}
}
}
#[inline]
fn expect_collection<
T: Deserializable<E, Self>,
C: FromIterator<T>
>(&mut self) -> Result<C, E> {
let token = try!(self.expect_token());
self.expect_collection_token(token)
}
#[inline]
fn expect_collection_token<
T: Deserializable<E, Self>,
C: FromIterator<T>
>(&mut self, token: Token) -> Result<C, E> {
let len = try!(self.expect_collection_start_token(token));
let iter = self.by_ref().batch(|d| {
let d = d.iter();
let token = match d.next() {
Some(token) => token,
None => { return None; }
};
match token {
Ok(CollectionEnd) => {
None
}
Ok(token) => {
let value: Result<T, E> = Deserializable::deserialize_token(d, token);
Some(value)
}
Err(e) => {
Some(Err(e))
}
}
});
result::collect_with_capacity(iter, len)
}
#[inline]
fn expect_collection_start(&mut self) -> Result<uint, E> {
let token = try!(self.expect_token());
self.expect_collection_start_token(token)
}
#[inline]
fn expect_collection_start_token(&mut self, token: Token) -> Result<uint, E> {
match token {
CollectionStart(len) => Ok(len),
_ => Err(self.syntax_error()),
}
}
#[inline]
fn expect_collection_end(&mut self) -> Result<(), E> {
let token = try!(self.expect_token());
self.expect_collection_end_token(token)
}
#[inline]
fn expect_collection_end_token(&mut self, token: Token) -> Result<(), E> {
match token {
CollectionEnd => Ok(()),
_ => Err(self.syntax_error()),
}
}
}
//////////////////////////////////////////////////////////////////////////////
pub trait Deserializable<E, D: Deserializer<E>> {
fn deserialize(d: &mut D) -> Result<Self, E>;
fn deserialize_token(d: &mut D, token: Token) -> Result<Self, E>;
}
//////////////////////////////////////////////////////////////////////////////
macro_rules! impl_deserializable {
($ty:ty, $method:ident, $method_token:ident) => {
impl<
E,
D: Deserializer<E>
> Deserializable<E, D> for $ty {
#[inline]
fn deserialize(d: &mut D) -> Result<$ty, E> {
d.$method()
}
#[inline]
fn deserialize_token(d: &mut D, token: Token) -> Result<$ty, E> {
d.$method_token(token)
}
}
}
}
impl_deserializable!(bool, expect_bool, expect_bool_token)
impl_deserializable!(int, expect_num, expect_num_token)
impl_deserializable!(i8, expect_num, expect_num_token)
impl_deserializable!(i16, expect_num, expect_num_token)
impl_deserializable!(i32, expect_num, expect_num_token)
impl_deserializable!(i64, expect_num, expect_num_token)
impl_deserializable!(uint, expect_num, expect_num_token)
impl_deserializable!(u8, expect_num, expect_num_token)
impl_deserializable!(u16, expect_num, expect_num_token)
impl_deserializable!(u32, expect_num, expect_num_token)
impl_deserializable!(u64, expect_num, expect_num_token)
impl_deserializable!(f32, expect_num, expect_num_token)
impl_deserializable!(f64, expect_num, expect_num_token)
impl_deserializable!(char, expect_char, expect_char_token)
impl_deserializable!(&'static str, expect_str, expect_str_token)
impl_deserializable!(StrBuf, expect_strbuf, expect_strbuf_token)
//////////////////////////////////////////////////////////////////////////////
impl<
E,
D: Deserializer<E>,
T: Deserializable<E, D>
> Deserializable<E, D> for Option<T> {
#[inline]
fn deserialize(d: &mut D) -> Result<Option<T>, E> {
d.expect_option()
}
#[inline]
fn deserialize_token(d: &mut D, token: Token) -> Result<Option<T>, E> {
d.expect_option_token(token)
}
}
//////////////////////////////////////////////////////////////////////////////
impl<
E,
D: Deserializer<E>,
T: Deserializable<E, D>
> Deserializable<E, D> for Vec<T> {
#[inline]
fn deserialize(d: &mut D) -> Result<Vec<T>, E> {
d.expect_collection()
}
#[inline]
fn deserialize_token(d: &mut D, token: Token) -> Result<Vec<T>, E> {
d.expect_collection_token(token)
}
}
impl<
E,
D: Deserializer<E>,
K: Deserializable<E, D> + TotalEq + Hash,
V: Deserializable<E, D>
> Deserializable<E, D> for HashMap<K, V> {
#[inline]
fn deserialize(d: &mut D) -> Result<HashMap<K, V>, E> {
d.expect_collection()
}
#[inline]
fn deserialize_token(d: &mut D, token: Token) -> Result<HashMap<K, V>, E> {
d.expect_collection_token(token)
}
}
//////////////////////////////////////////////////////////////////////////////
impl<
E,
D: Deserializer<E>
> Deserializable<E, D> for () {
#[inline]
fn deserialize(d: &mut D) -> Result<(), E> {
d.expect_null()
}
#[inline]
fn deserialize_token(d: &mut D, token: Token) -> Result<(), E> {
d.expect_null_token(token)
}
}
//////////////////////////////////////////////////////////////////////////////
macro_rules! peel(($name:ident, $($other:ident,)*) => (deserialize_tuple!($($other,)*)))
macro_rules! deserialize_tuple (
() => ();
( $($name:ident,)+ ) => (
impl<
E,
D: Deserializer<E>,
$($name:Deserializable<E, D>),*
> Deserializable<E, D> for ($($name,)*) {
#[inline]
#[allow(uppercase_variables)]
fn deserialize(d: &mut D) -> Result<($($name,)*), E> {
try!(d.expect_collection_start());
let result = ($(
{
let $name = try!(Deserializable::deserialize(d));
$name
}
,)*);
try!(d.expect_collection_end());
Ok(result)
}
#[inline]
#[allow(uppercase_variables)]
fn deserialize_token(d: &mut D, token: Token) -> Result<($($name,)*), E> {
try!(d.expect_collection_start_token(token));
let result = ($(
{
let $name = try!(Deserializable::deserialize(d));
$name
}
,)*);
try!(d.expect_collection_end());
Ok(result)
}
}
peel!($($name,)*)
)
)
deserialize_tuple! { T0, T1, T2, T3, T4, T5, T6, T7, T8, T9, T10, T11, }
//////////////////////////////////////////////////////////////////////////////
#[cfg(test)]
mod tests {
extern crate serialize;
use std::vec;
use collections::HashMap;
use test::Bencher;
use self::serialize::{Decoder, Decodable};
use super::{Token, Int, StrBuf, CollectionStart, CollectionEnd};
use super::{Deserializer, Deserializable};
//////////////////////////////////////////////////////////////////////////////
#[deriving(Show)]
enum Error {
EndOfStream,
SyntaxError,
}
//////////////////////////////////////////////////////////////////////////////
struct TokenDeserializer {
tokens: Vec<Token>,
}
impl TokenDeserializer {
#[inline]
fn new(tokens: Vec<Token>) -> TokenDeserializer {
TokenDeserializer {
tokens: tokens,
}
}
}
impl Iterator<Result<Token, Error>> for TokenDeserializer {
#[inline]
fn next(&mut self) -> Option<Result<Token, Error>> {
match self.tokens.shift() {
None => None,
Some(token) => Some(Ok(token)),
}
}
}
impl Deserializer<Error> for TokenDeserializer {
#[inline]
fn end_of_stream_error(&self) -> Error {
EndOfStream
}
#[inline]
fn syntax_error(&self) -> Error {
SyntaxError
}
}
//////////////////////////////////////////////////////////////////////////////
#[deriving(Eq, Show)]
enum IntsDeserializerState {
Start,
Sep,
//Value,
End,
}
struct IntsDeserializer {
state: IntsDeserializerState,
len: uint,
iter: vec::MoveItems<int>,
value: Option<int>
}
impl IntsDeserializer {
#[inline]
fn new(values: Vec<int>) -> IntsDeserializer {
IntsDeserializer {
state: Start,
len: values.len(),
iter: values.move_iter(),
value: None,
}
}
}
impl Iterator<Result<Token, Error>> for IntsDeserializer {
#[inline]
fn next(&mut self) -> Option<Result<Token, Error>> {
match self.state {
Start => {
self.state = Sep;
Some(Ok(CollectionStart(self.len)))
}
Sep => {
match self.iter.next() {
Some(value) => {
self.state = Sep;
self.value = Some(value);
Some(Ok(Int(value)))
}
None => {
self.state = End;
Some(Ok(CollectionEnd))
}
}
}
/*
Value => {
self.state = Sep;
match self.value.take() {
Some(value) => Some(Ok(Int(value))),
None => Some(Err(self.end_of_stream_error())),
}
}
*/
End => {
None
}
}
}
}
impl Deserializer<Error> for IntsDeserializer {
#[inline]
fn end_of_stream_error(&self) -> Error {
EndOfStream
}
#[inline]
fn syntax_error(&self) -> Error {
SyntaxError
}
/*
#[inline]
fn expect_int(&mut self, token: Token) -> Result<int, Error> {
assert_eq!(self.state, Value);
self.state = Sep;
match self.value.take() {
Some(value) => Ok(value),
None => Err(self.end_of_stream_error()),
}
}
*/
}
struct IntsDecoder {
iter: vec::MoveItems<int>,
}
impl IntsDecoder {
#[inline]
fn new(values: Vec<int>) -> IntsDecoder {
IntsDecoder {
iter: values.move_iter()
}
}
}
impl Decoder<Error> for IntsDecoder {
// Primitive types:
fn read_nil(&mut self) -> Result<(), Error> { Err(SyntaxError) }
fn read_uint(&mut self) -> Result<uint, Error> { Err(SyntaxError) }
fn read_u64(&mut self) -> Result<u64, Error> { Err(SyntaxError) }
fn read_u32(&mut self) -> Result<u32, Error> { Err(SyntaxError) }
fn read_u16(&mut self) -> Result<u16, Error> { Err(SyntaxError) }
fn read_u8(&mut self) -> Result<u8, Error> { Err(SyntaxError) }
#[inline]
fn read_int(&mut self) -> Result<int, Error> {
match self.iter.next() {
Some(value) => Ok(value),
None => Err(EndOfStream),
}
}
fn read_i64(&mut self) -> Result<i64, Error> { Err(SyntaxError) }
fn read_i32(&mut self) -> Result<i32, Error> { Err(SyntaxError) }
fn read_i16(&mut self) -> Result<i16, Error> { Err(SyntaxError) }
fn read_i8(&mut self) -> Result<i8, Error> { Err(SyntaxError) }
fn read_bool(&mut self) -> Result<bool, Error> { Err(SyntaxError) }
fn read_f64(&mut self) -> Result<f64, Error> { Err(SyntaxError) }
fn read_f32(&mut self) -> Result<f32, Error> { Err(SyntaxError) }
fn read_char(&mut self) -> Result<char, Error> { Err(SyntaxError) }
fn read_str(&mut self) -> Result<StrBuf, Error> { Err(SyntaxError) }
// Compound types:
fn read_enum<T>(&mut self, _name: &str, _f: |&mut IntsDecoder| -> Result<T, Error>) -> Result<T, Error> { Err(SyntaxError) }
fn read_enum_variant<T>(&mut self,
_names: &[&str],
_f: |&mut IntsDecoder, uint| -> Result<T, Error>)
-> Result<T, Error> { Err(SyntaxError) }
fn read_enum_variant_arg<T>(&mut self,
_a_idx: uint,
_f: |&mut IntsDecoder| -> Result<T, Error>)
-> Result<T, Error> { Err(SyntaxError) }
fn read_enum_struct_variant<T>(&mut self,
_names: &[&str],
_f: |&mut IntsDecoder, uint| -> Result<T, Error>)
-> Result<T, Error> { Err(SyntaxError) }
fn read_enum_struct_variant_field<T>(&mut self,
_f_name: &str,
_f_idx: uint,
_f: |&mut IntsDecoder| -> Result<T, Error>)
-> Result<T, Error> { Err(SyntaxError) }
fn read_struct<T>(&mut self, _s_name: &str, _len: uint, _f: |&mut IntsDecoder| -> Result<T, Error>)
-> Result<T, Error> { Err(SyntaxError) }
fn read_struct_field<T>(&mut self,
_f_name: &str,
_f_idx: uint,
_f: |&mut IntsDecoder| -> Result<T, Error>)
-> Result<T, Error> { Err(SyntaxError) }
fn read_tuple<T>(&mut self, _f: |&mut IntsDecoder, uint| -> Result<T, Error>) -> Result<T, Error> { Err(SyntaxError) }
fn read_tuple_arg<T>(&mut self, _a_idx: uint, _f: |&mut IntsDecoder| -> Result<T, Error>) -> Result<T, Error> { Err(SyntaxError) }
fn read_tuple_struct<T>(&mut self,
_s_name: &str,
_f: |&mut IntsDecoder, uint| -> Result<T, Error>)
-> Result<T, Error> { Err(SyntaxError) }
fn read_tuple_struct_arg<T>(&mut self,
_a_idx: uint,
_f: |&mut IntsDecoder| -> Result<T, Error>)
-> Result<T, Error> { Err(SyntaxError) }
// Specialized types:
fn read_option<T>(&mut self, _f: |&mut IntsDecoder, bool| -> Result<T, Error>) -> Result<T, Error> { Err(SyntaxError) }
#[inline]
fn read_seq<T>(&mut self, f: |&mut IntsDecoder, uint| -> Result<T, Error>) -> Result<T, Error> {
f(self, 3)
}
#[inline]
fn read_seq_elt<T>(&mut self, _idx: uint, f: |&mut IntsDecoder| -> Result<T, Error>) -> Result<T, Error> {
f(self)
}
fn read_map<T>(&mut self, _f: |&mut IntsDecoder, uint| -> Result<T, Error>) -> Result<T, Error> { Err(SyntaxError) }
fn read_map_elt_key<T>(&mut self, _idx: uint, _f: |&mut IntsDecoder| -> Result<T, Error>) -> Result<T, Error> { Err(SyntaxError) }
fn read_map_elt_val<T>(&mut self, _idx: uint, _f: |&mut IntsDecoder| -> Result<T, Error>) -> Result<T, Error> { Err(SyntaxError) }
}
#[test]
fn test_tokens_int() {
let tokens = vec!(
Int(5),
);
let mut deserializer = TokenDeserializer::new(tokens);
let value: Result<int, Error> = Deserializable::deserialize(&mut deserializer);
assert_eq!(value.unwrap(), 5);
}
#[test]
fn test_tokens_strbuf() {
let tokens = vec!(
StrBuf("a".to_strbuf()),
);
let mut deserializer = TokenDeserializer::new(tokens);
let value: Result<StrBuf, Error> = Deserializable::deserialize(&mut deserializer);
assert_eq!(value.unwrap(), "a".to_strbuf());
}
#[test]
fn test_tokens_tuple_empty() {
let tokens = vec!(
CollectionStart(0),
CollectionEnd,
);
let mut deserializer = TokenDeserializer::new(tokens);
let value: Result<(), Error> = Deserializable::deserialize(&mut deserializer);
assert_eq!(value.unwrap(), ());
}
#[test]
fn test_tokens_tuple() {
let tokens = vec!(
CollectionStart(2),
Int(5),
StrBuf("a".to_strbuf()),
CollectionEnd,
);
let mut deserializer = TokenDeserializer::new(tokens);
let value: Result<(int, StrBuf), Error> = Deserializable::deserialize(&mut deserializer);
assert_eq!(value.unwrap(), (5, "a".to_strbuf()));
}
#[test]
fn test_tokens_tuple_compound() {
let tokens = vec!(
CollectionStart(2),
CollectionStart(0),
CollectionEnd,
CollectionStart(2),
Int(5),
StrBuf("a".to_strbuf()),
CollectionEnd,
CollectionEnd,
);
let mut deserializer = TokenDeserializer::new(tokens);
let value: Result<((), (int, StrBuf)), Error> = Deserializable::deserialize(&mut deserializer);
assert_eq!(value.unwrap(), ((), (5, "a".to_strbuf())));
}
#[test]
fn test_tokens_vec_empty() {
let tokens = vec!(
CollectionStart(0),
CollectionEnd,
);
let mut deserializer = TokenDeserializer::new(tokens);
let value: Result<Vec<int>, Error> = Deserializable::deserialize(&mut deserializer);
assert_eq!(value.unwrap(), vec!());
}
#[test]
fn test_tokens_vec() {
let tokens = vec!(
CollectionStart(3),
Int(5),
Int(6),
Int(7),
CollectionEnd,
);
let mut deserializer = TokenDeserializer::new(tokens);
let value: Result<Vec<int>, Error> = Deserializable::deserialize(&mut deserializer);
assert_eq!(value.unwrap(), vec!(5, 6, 7));
}
#[test]
fn test_tokens_vec_compound() {
let tokens = vec!(
CollectionStart(0),
CollectionStart(1),
Int(1),
CollectionEnd,
CollectionStart(2),
Int(2),
Int(3),
CollectionEnd,
CollectionStart(3),
Int(4),
Int(5),
Int(6),
CollectionEnd,
CollectionEnd,
);
let mut deserializer = TokenDeserializer::new(tokens);
let value: Result<Vec<Vec<int>>, Error> = Deserializable::deserialize(&mut deserializer);
assert_eq!(value.unwrap(), vec!(vec!(1), vec!(2, 3), vec!(4, 5, 6)));
}
#[test]
fn test_tokens_hashmap() {
let tokens = vec!(
CollectionStart(2),
CollectionStart(2),
Int(5),
StrBuf("a".to_strbuf()),
CollectionEnd,
CollectionStart(2),
Int(6),
StrBuf("b".to_strbuf()),
CollectionEnd,
CollectionEnd,
);
let mut deserializer = TokenDeserializer::new(tokens);
let value: Result<HashMap<int, StrBuf>, Error> = Deserializable::deserialize(&mut deserializer);
let mut map = HashMap::new();
map.insert(5, "a".to_strbuf());
map.insert(6, "b".to_strbuf());
assert_eq!(value.unwrap(), map);
}
#[bench]
fn bench_dummy_deserializer(b: &mut Bencher) {
b.iter(|| {
let tokens = vec!(
CollectionStart(3),
Int(5),
Int(6),
Int(7),
CollectionEnd,
);
let mut d = TokenDeserializer::new(tokens);
let value: Result<Vec<int>, Error> = Deserializable::deserialize(&mut d);
assert_eq!(value.unwrap(), vec!(5, 6, 7));
})
}
#[bench]
fn bench_ints_deserializer(b: &mut Bencher) {
b.iter(|| {
let ints = vec!(5, 6, 7);
let mut d = IntsDeserializer::new(ints);
let value: Result<Vec<int>, Error> = Deserializable::deserialize(&mut d);
assert_eq!(value.unwrap(), vec!(5, 6, 7));
})
}
#[bench]
fn bench_ints_decoder(b: &mut Bencher) {
b.iter(|| {
let ints = vec!(5, 6, 7);
let mut d = IntsDecoder::new(ints);
let value: Result<Vec<int>, Error> = Decodable::decode(&mut d);
assert_eq!(value.unwrap(), vec!(5, 6, 7));
})
}
}