//! Transform bytes into tokens
use std::str;
use std::rc::Rc;

use nom::{IResult, hex_digit, digit, Needed};
use nom::{AsChar, InputLength, InputIter, Slice, ErrorKind};

use ::token::{Id, Tk, New, Tag, Num, Ws};

pub use nom::IResult as LexResult;

/// Struct that provides the operations to take a slice of bytes and
/// convert them into `Tk` tokens.
#[derive(Debug, Clone, Copy, Serialize)]
pub struct Lexer;


impl Lexer {
    pub fn new() -> Self {
        Lexer {}
    }

    /// Convert a slice of bytes into a `Rc<Vec<Tk>>`
    #[deprecated]
    pub fn tokenize<'a>(&self, bytes: &'a [u8]) -> Rc<LexResult<&'a [u8], Vec<Tk<'a>>>> {
        let result = tokenize_bytes(bytes);
        Rc::new(result)
    }

    /// Convert a slice of bytes into `Vec<Tk<'a>>`
    pub fn tokenize2<'a>(&self, bytes: &'a [u8]) -> LexResult<&'a [u8], Vec<Tk<'a>>>{
        tokenize_bytes(bytes)
    }
}


/// Entry point of the lexer into nom parser
named!(pub tokenize_bytes <Vec<Tk>>, do_parse!(
    tokens: many0!(
        alt_complete!(
            space       |
            endline     |
            number      |
            symbol      |
            operator    |
            string      |
            identifier  |
            error_marker)
                            )>>
    (tokens)
));


named!(number <Tk>, do_parse!(
    tuple : alt_complete!(
            call!(sublex_hex)     => { |r: &'a[u8]| (&r[..], Tag::N(Num::Hex))      } |
            call!(sublex_bin)     => { |r: &'a[u8]| (&r[..], Tag::N(Num::Binary))   } |
            call!(sublex_octal)   => { |r: &'a[u8]| (&r[..], Tag::N(Num::Octal))    } |
            call!(sublex_complex) => { |r: &'a[u8]| (&r[..], Tag::N(Num::Complex))  } |
            call!(sublex_float)   => { |r: &'a[u8]| (&r[..], Tag::N(Num::Float))    } |
            call!(digit)          => { |r: &'a[u8]| (&r[..], Tag::N(Num::Int))      } ) >>
    (Tk::new(Id::Number, tuple.0, tuple.1))
));


/// Called by `number` to parse `"0x"` prefixed hexadecimal integer strings
named!(sublex_hex <&[u8]>, recognize!(preceded!(tag!("0x"), hex_digit)));

/// Called by `number` to parse `"0x"` prefixed binary integer strings
named!(sublex_bin <&[u8]>, recognize!(preceded!(tag!("0b"), many1!(one_of!("01")))));

/// Called by `number` to parse `"0x"` prefixed octal integer strings
named!(sublex_octal <&[u8]>, recognize!(preceded!(tag!("0o"), hex_digit)));

/// Called by `number` to parse floats
named!(sublex_float <&[u8]>, recognize!(delimited!(opt!(digit), tag!("."), digit)));

/// Called by `number` to parse `'j'` suffixed floats as complex numbers
named!(sublex_complex <&[u8]>, recognize!(preceded!(alt!(sublex_float | digit), tag!("j"))));


/// Mark the end of each line since it is the end-of-statement qualifier in python
named!(endline <Tk>, do_parse!(
    nl: tag!("\n") >>
    (Tk::new(Id::Newline,  nl, Tag::W(Ws::Newline)))
));


named!(space <Tk>, do_parse!(
    tk: alt!(
        tag!(" ")  => { |r: &'a[u8]| (Tk::new(Id::Space, r, Tag::None)) } |
        tag!("\t") => { |r: &'a[u8]| (Tk::new(Id::Tab, r, Tag::None))   } ) >>
    (tk)
));


/// Keep chugging along if
named!(error_marker <Tk>, do_parse!(
    content: take!(1) >>
    (Tk::new(Id::ErrorMarker, content, Tag::None))
));


/// Discover if the next `[u8]` bytes are an identifier `Id::Name`. Cross reference
/// the matched bytes with the known keywords with `as_keyword`. If a keyword matches
/// a keyword a `Tk` with `Id::Keyword` is returned instead.
named!(identifier <Tk>, do_parse!(
    name: call!(ident) >>
    (match as_keyword(name) {
            Some(tag) => tag,
            None => Tk::new(Id::Name, name, Tag::Ident)
        }
    )
));


/// First step in parsing one of the several flavors of string literals for Python.
/// Use a 1 byte lookahead to determine if the first byte matches any parsable string
/// prefix and dispatch the lexer for that particular string format.
named!(string <Tk>, do_parse!(
    token: switch!(peek!(take!(1)),
        b"#" =>  call!(sublex_comment_string)       |
        b"'" =>  call!(sublex_string)               |
        b"\"" => call!(sublex_string)               |
        b"r" =>  call!(sublex_rprefix_string)       |
        b"b" =>  call!(sublex_bprefix_string)       |
        b"f" =>  call!(sublex_fprefix_string)       ) >>
    (token)
));


/// Call the generic string sublexer for `'`, `"`, `'''`, `"""` strings
/// and tag the result as an `Id::String`.
named!(sublex_string <Tk>, do_parse!(
    bytes: sublex_string_u8 >>
    (Tk::new(Id::String, bytes, Tag::None))
));


/// Comments (`Id::Comment`) are strings that start with `#` and continue until `\n`.
named!(sublex_comment_string <Tk>, do_parse!(
    bytes: alt_complete!(
        recognize!(preceded!(tag!(b"#"), is_not!("\n"))) |
        tag!(b"#")                                       )>>
    (Tk::new(Id::Comment, bytes, Tag::None))
));


/// `r` prefixed "raw" strings, `Id::RawString`
named!(sublex_rprefix_string <Tk>, do_parse!(
    bytes: sublex_prefixed_string_u8 >>
    (Tk::new(Id::RawString, bytes, Tag::None))
));


/// `b` prefixed byte string, `Id:ByteString`
named!(sublex_bprefix_string <Tk>, do_parse!(
    bytes: sublex_prefixed_string_u8 >>
    (Tk::new(Id::ByteString, bytes, Tag::None))
));


/// `f` prefix format string, `Id::FormatString`
named!(sublex_fprefix_string <Tk>, do_parse!(
    bytes: sublex_prefixed_string_u8 >>
    (Tk::new(Id::FormatString, bytes, Tag::None))
));


/// For the known prefixed strings, remove the prefix and
/// dispatch the plain string lexer.
named!(sublex_prefixed_string_u8 <&[u8]>,  do_parse!(
    result: preceded!(
        take!(1),
        call!(sublex_string_u8)) >>
        (result)
));


/// Peek at the first byte of the current input and dispatch either
/// the single or double quote string lexers for `'` and `"` respectively.
named!(sublex_string_u8 <&[u8]>, do_parse!(
    bytes: switch!(peek!(take!(1)),
        b"'" =>  call!(sublex_squote_string_u8)  |
        b"\"" => call!(sublex_dquote_string_u8)  ) >>
    (bytes)
));


/// Peek at the first 3 characters of input. If the it is all `'''` try to parse
/// the triple-single quoted string. Otherwise a single quoted string.
named!(sublex_squote_string_u8 <&[u8]>, do_parse!(
    bytes: alt_complete!(
        switch!(peek!(take!(3)),
            b"'''" => recognize!(
                        delimited!(
                            take!(3),
                            take_until!("'''"),
                            take!(3)))                      |
            _ => recognize!(
                    delimited!(
                        tag!("'"),
                        take_until!("'"),
                        tag!("'")))
        )                                                           |
        tag!("''''''")                                              |
        tag!("''")                                                  )>>

    (bytes)
));


named!(sublex_dquote_string_u8 <&[u8]>, do_parse!(
    bytes: alt_complete!(
        switch!(peek!(take!(3)),
            b"\"\"\"" => recognize!(
                            delimited!(
                                take!(3),
                                take_until!("\"\"\""),
                                take!(3)))                  |
            _ => recognize!(
                    delimited!(
                        tag!("\""),
                        take_until!("\""),
                        tag!("\"")))
        )                                                           |
        tag!("\"\"\"\"\"\"")                                        |
        tag!("\"\"")                                                ) >>

    (bytes)
));


/// Tag all of the special symbols that can begin, terminate, or delimit an expression
/// in some way. Each symbol is tagged with it's pertinent `Id`.
named!(symbol <Tk>, do_parse!(
    token: alt!(
        tag!("(")   => { |r: &'a[u8]| (Tk::new(Id::LeftParen, r, Tag::None))       } |
        tag!("[")   => { |r: &'a[u8]| (Tk::new(Id::LeftBracket, r, Tag::None))     } |
        tag!("{")   => { |r: &'a[u8]| (Tk::new(Id::LeftBrace, r, Tag::None))       } |
        tag!("}")   => { |r: &'a[u8]| (Tk::new(Id::RightBrace, r, Tag::None))      } |
        tag!("]")   => { |r: &'a[u8]| (Tk::new(Id::RightBracket, r, Tag::None))    } |
        tag!(")")   => { |r: &'a[u8]| (Tk::new(Id::RightParen, r, Tag::None))      } |
        tag!(",")   => { |r: &'a[u8]| (Tk::new(Id::Comma, r, Tag::None))           } |
        tag!(";")   => { |r: &'a[u8]| (Tk::new(Id::Semicolon, r, Tag::None))       } |
        tag!(":")   => { |r: &'a[u8]| (Tk::new(Id::Colon, r, Tag::None))           } |
        tag!("\\")  => { |r: &'a[u8]| (Tk::new(Id::Backslash, r, Tag::None))       }) >>
    (token)
));


named!(operator <Tk>, do_parse!(
    token : alt_complete!(
            // r: &'a [u8] are the bytes captured by the tag on the LHS.
            // that is mapped with the closure to a tuple of the slice of the
            // result mapped to its appropriate tag.
            tag!(r"<<=") => { |r: &'a[u8]| (Tk::new(Id::LeftShiftEqual, r, Tag::None))    } |
            tag!(r">>=") => { |r: &'a[u8]| (Tk::new(Id::RightShiftEqual, r, Tag::None))   } |
            tag!(r"**=") => { |r: &'a[u8]| (Tk::new(Id::DoubleStarEqual, r, Tag::None))   } |
            tag!(r"//=") => { |r: &'a[u8]| (Tk::new(Id::DoubleSlashEqual, r, Tag::None))  } |
            tag!(r"...") => { |r: &'a[u8]| (Tk::new(Id::Ellipsis, r, Tag::None))          } |
            tag!(r"==") =>  { |r: &'a[u8]| (Tk::new(Id::DoubleEqual, r, Tag::None))       } |
            tag!(r"!=") =>  { |r: &'a[u8]| (Tk::new(Id::NotEqual, r, Tag::None))          } |
            tag!(r"<>") =>  { |r: &'a[u8]| (Tk::new(Id::NotEqual, r, Tag::None))          } |
            tag!(r"<=") =>  { |r: &'a[u8]| (Tk::new(Id::LessOrEqual, r, Tag::None))       } |
            tag!(r"<<") =>  { |r: &'a[u8]| (Tk::new(Id::LeftShift, r, Tag::None))         } |
            tag!(r">=") =>  { |r: &'a[u8]| (Tk::new(Id::GreaterOrEqual, r, Tag::None))    } |
            tag!(r">>") =>  { |r: &'a[u8]| (Tk::new(Id::RightShift, r, Tag::None))        } |
            tag!(r"+=") =>  { |r: &'a[u8]| (Tk::new(Id::PlusEqual, r, Tag::None))         } |
            tag!(r"-=") =>  { |r: &'a[u8]| (Tk::new(Id::MinusEqual, r, Tag::None))        } |
            tag!(r"->") =>  { |r: &'a[u8]| (Tk::new(Id::RightArrow, r, Tag::None))        } |
            tag!(r"**") =>  { |r: &'a[u8]| (Tk::new(Id::DoubleStar, r, Tag::None))        } |
            tag!(r"*=") =>  { |r: &'a[u8]| (Tk::new(Id::StarEqual, r, Tag::None))         } |
            tag!(r"//") =>  { |r: &'a[u8]| (Tk::new(Id::DoubleSlash, r, Tag::None))       } |
            tag!(r"/=") =>  { |r: &'a[u8]| (Tk::new(Id::SlashEqual, r, Tag::None))        } |
            tag!(r"|=") =>  { |r: &'a[u8]| (Tk::new(Id::PipeEqual, r, Tag::None))         } |
            tag!(r"%=") =>  { |r: &'a[u8]| (Tk::new(Id::PercentEqual, r, Tag::None))      } |
            tag!(r"&=") =>  { |r: &'a[u8]| (Tk::new(Id::AmpEqual, r, Tag::None))          } |
            tag!(r"^=") =>  { |r: &'a[u8]| (Tk::new(Id::CaretEqual, r, Tag::None))        } |
            tag!(r"@=") =>  { |r: &'a[u8]| (Tk::new(Id::AtEqual, r, Tag::None))           } |
            tag!(r"+") =>   { |r: &'a[u8]| (Tk::new(Id::Plus, r, Tag::None))              } |
            tag!(r"-") =>   { |r: &'a[u8]| (Tk::new(Id::Minus, r, Tag::None))             } |
            tag!(r"*") =>   { |r: &'a[u8]| (Tk::new(Id::Star, r, Tag::None))              } |
            tag!(r"/") =>   { |r: &'a[u8]| (Tk::new(Id::Slash, r, Tag::None))             } |
            tag!(r"|") =>   { |r: &'a[u8]| (Tk::new(Id::Pipe, r, Tag::None))              } |
            tag!(r"&") =>   { |r: &'a[u8]| (Tk::new(Id::Amp, r, Tag::None))               } |
            tag!(r"<") =>   { |r: &'a[u8]| (Tk::new(Id::LeftAngle, r, Tag::None))         } |
            tag!(r">") =>   { |r: &'a[u8]| (Tk::new(Id::RightAngle, r, Tag::None))        } |
            tag!(r"=") =>   { |r: &'a[u8]| (Tk::new(Id::Equal, r, Tag::None))             } |
            tag!(r"%") =>   { |r: &'a[u8]| (Tk::new(Id::Percent, r, Tag::None))           } |
            tag!(r"^") =>   { |r: &'a[u8]| (Tk::new(Id::Caret, r, Tag::None))             } |
            tag!(r"~") =>   { |r: &'a[u8]| (Tk::new(Id::Tilde, r, Tag::None))             } |
            tag!(r"@") =>   { |r: &'a[u8]| (Tk::new(Id::At, r, Tag::None))                } |
            tag!(r".") =>   { |r: &'a[u8]| (Tk::new(Id::Dot, r, Tag::None))               }) >>
       (token)
));


/// Use a hardcoded match expression to match if a string is a keyword.
fn as_keyword(bytes: &[u8]) -> Option<Tk> {
    let string = match str::from_utf8(bytes) {
        Ok(string) => string,
        _ => return None
    };

    match string {
        "False"     => Some(Tk::new(Id::False, bytes, Tag::None)),
        "None"      => Some(Tk::new(Id::None, bytes, Tag::None)),
        "True"      => Some(Tk::new(Id::True, bytes, Tag::None)),
        "and"       => Some(Tk::new(Id::And, bytes, Tag::None)),
        "as"        => Some(Tk::new(Id::As, bytes, Tag::None)),
        "assert"    => Some(Tk::new(Id::Assert, bytes, Tag::None)),
        "async"     => Some(Tk::new(Id::Assert, bytes, Tag::None)),
        "break"     => Some(Tk::new(Id::Break, bytes, Tag::None)),
        "class"     => Some(Tk::new(Id::Class, bytes, Tag::None)),
        "continue"  => Some(Tk::new(Id::Continue, bytes, Tag::None)),
        "def"       => Some(Tk::new(Id::Def, bytes, Tag::None)),
        "del"       => Some(Tk::new(Id::Del, bytes, Tag::None)),
        "elif"      => Some(Tk::new(Id::Elif, bytes, Tag::None)),
        "else"      => Some(Tk::new(Id::Else, bytes, Tag::None)),
        "except"    => Some(Tk::new(Id::Except, bytes, Tag::None)),
        "finally"   => Some(Tk::new(Id::Finally, bytes, Tag::None)),
        "for"       => Some(Tk::new(Id::For, bytes, Tag::None)),
        "from"      => Some(Tk::new(Id::From, bytes, Tag::None)),
        "global"    => Some(Tk::new(Id::Global, bytes, Tag::None)),
        "if"        => Some(Tk::new(Id::If, bytes, Tag::None)),
        "import"    => Some(Tk::new(Id::Import, bytes, Tag::None)),
        "in"        => Some(Tk::new(Id::In, bytes, Tag::None)),
        "is"        => Some(Tk::new(Id::Is, bytes, Tag::None)),
        "lambda"    => Some(Tk::new(Id::Lambda, bytes, Tag::None)),
        "nonlocal"  => Some(Tk::new(Id::Nonlocal, bytes, Tag::None)),
        "not"       => Some(Tk::new(Id::Not, bytes, Tag::None)),
        "or"        => Some(Tk::new(Id::Or, bytes, Tag::None)),
        "pass"      => Some(Tk::new(Id::Pass, bytes, Tag::None)),
        "raise"     => Some(Tk::new(Id::Raise, bytes, Tag::None)),
        "return"    => Some(Tk::new(Id::Return, bytes, Tag::None)),
        "try"       => Some(Tk::new(Id::Try, bytes, Tag::None)),
        "while"     => Some(Tk::new(Id::While, bytes, Tag::None)),
        "with"      => Some(Tk::new(Id::With, bytes, Tag::None)),
        "yield"     => Some(Tk::new(Id::Yield, bytes, Tag::None)),
        _           => None
    }
}


/// The Ident trait and related function `ident()` are special forms if `nom::alphanum` to
/// handle the special rules around identifiers instead of creating a more complex ident
/// parser.
pub trait Ident: where Self: AsChar {
    fn is_ident_start(&self) -> bool;
    fn is_ident(&self) -> bool;
}


/// Define the ident type for the u8 byte type like nom does with nom::AsChar.
impl Ident for u8 {
    fn is_ident_start(&self) -> bool {
        self.is_alpha() || (self.as_char() == '_' )
    }

    fn is_ident(&self) -> bool {
        self.is_alphanum() || (self.as_char() == '_' )
    }
}


/// Recognizes a python identifier in a form defined
/// by the regular expression `[_a-zA-Z][_a-zA-Z0-9]*`
pub fn ident(input: &[u8]) -> IResult<&[u8],&[u8]> {

    let input_length = input.input_len();

    if input_length == 0 {
        return IResult::Incomplete(Needed::Unknown);
    }

    for (idx, item) in input.iter_indices() {
        /// Now we get a sexy state [1 x 3] state matrix to compare
        ///  (current_index, is_ident_start_char, is_ident_continuation_char)
        ///
        match (idx, item.is_ident_start(), item.is_ident()) {
            (0, true , _   ) => continue,
            (0, false, _   ) => return IResult::Error(error_position!(ErrorKind::AlphaNumeric, input)),
            (_, _    , true) => continue,
            (_, _    , _   ) => return IResult::Done(input.slice(idx..), input.slice(0..idx))
        }
    }

    IResult::Done(input.slice(input_length..), input)
}



#[cfg(test)]
mod tests {
    use super::*;
    use ::fmt;



    /// Use to create a named test case of a single line snippet of code.
    /// This `basic_test!(print_function, "print('hello world!')`
    /// will create a test function named `print_function` that will try to parse the
    /// string.
    macro_rules! basic_test {
        ($name:ident, $code:expr, $id:expr, $tag:expr) => {
            basic_test!($name, $code, $id, $tag, true);
        };
        ($name:ident, $code:expr, $id:expr, $tag:expr, $trim:expr) => {
            #[test]
            fn $name() {
                if $trim {
                    let value = tokenize_bytes(($code).trim().as_bytes()).unwrap();
                    assert_token(&value, $id, $tag);
                } else {
                    // For matching ws
                    let value = tokenize_bytes(($code).as_bytes()).unwrap();
                    assert_token(&value, $id, $tag);
                }
            }
        };

    }


    fn assert_token(value: &(&[u8], Vec<Tk>), id: Id, tag: Tag) {
        println!("{}", fmt::tokens(&value.1, true));

        assert_eq!(value.1.len(), 1);
        let ref token = value.1[0];
        assert_eq!(token.id(), id);
        assert_eq!(token.tag(), tag);
    }


    // The venerable whitespace tokens
    basic_test!(tk_space,           " ",                Id::Space,      Tag::None,           false);
    basic_test!(tk_newline,         "\n",               Id::Newline,    Tag::W(Ws::Newline), false);

    // Numbers
    basic_test!(tk_number_int,      "12345",            Id::Number, Tag::N(Num::Int));
    basic_test!(tk_number_hex,      "0xdeadbeef12345",  Id::Number, Tag::N(Num::Hex));
    basic_test!(tk_number_oct,      "0o70721",          Id::Number, Tag::N(Num::Octal));
    basic_test!(tk_number_bin,      "0b01110",          Id::Number, Tag::N(Num::Binary));
    basic_test!(tk_number_float,    "12.45",            Id::Number, Tag::N(Num::Float));
    basic_test!(tk_number_float2,   ".45",              Id::Number, Tag::N(Num::Float));
    basic_test!(tk_number_complex,  "42j",              Id::Number, Tag::N(Num::Complex));
    basic_test!(tk_number_complex2, ".34j",             Id::Number, Tag::N(Num::Complex));

    
    basic_test!(tk_op_leftshiftequal,	    r"<<=",	Id::LeftShiftEqual,	    Tag::None);
    basic_test!(tk_op_rightshiftequal,	    r">>=",	Id::RightShiftEqual,	Tag::None);
    basic_test!(tk_op_doublestarequal,	    r"**=",	Id::DoubleStarEqual,	Tag::None);
    basic_test!(tk_op_doubleslashequal,    r"//=",	Id::DoubleSlashEqual,	Tag::None);
    basic_test!(tk_op_ellipsis,	            r"...",	Id::Ellipsis,	        Tag::None);
    basic_test!(tk_op_doubleequal,	        r"==",	Id::DoubleEqual,	    Tag::None);
    basic_test!(tk_op_notequal,	            r"!=",	Id::NotEqual,	        Tag::None);
    basic_test!(tk_op_notequal2,            r"<>",	Id::NotEqual,	        Tag::None);
    basic_test!(tk_op_lessorequal,	        r"<=",	Id::LessOrEqual,	    Tag::None);
    basic_test!(tk_op_leftshift,	        r"<<",	Id::LeftShift,	        Tag::None);
    basic_test!(tk_op_greaterorequal,	    r">=",	Id::GreaterOrEqual,	    Tag::None);
    basic_test!(tk_op_rightshift,	        r">>",	Id::RightShift,	        Tag::None);
    basic_test!(tk_op_plusequal,	        r"+=",	Id::PlusEqual,	        Tag::None);
    basic_test!(tk_op_minusequal,	        r"-=",	Id::MinusEqual,	        Tag::None);
    basic_test!(tk_op_rightarrow,	        r"->",	Id::RightArrow,	        Tag::None);
    basic_test!(tk_op_doublestar,	        r"**",	Id::DoubleStar,	        Tag::None);
    basic_test!(tk_op_starequal,	        r"*=",	Id::StarEqual,	        Tag::None);
    basic_test!(tk_op_doubleslash,	        r"//",	Id::DoubleSlash,	    Tag::None);
    basic_test!(tk_op_slashequal,	        r"/=",	Id::SlashEqual,	        Tag::None);
    basic_test!(tk_op_pipeequal,	        r"|=",	Id::PipeEqual,	        Tag::None);
    basic_test!(tk_op_percentequal, 	    r"%=",	Id::PercentEqual,	    Tag::None);
    basic_test!(tk_op_ampequal,	            r"&=",	Id::AmpEqual,	        Tag::None);
    basic_test!(tk_op_caretequal,	        r"^=",	Id::CaretEqual,	        Tag::None);
    basic_test!(tk_op_atequal,	            r"@=",	Id::AtEqual,	        Tag::None);
    basic_test!(tk_op_plus,	                r"+",	Id::Plus,	            Tag::None);
    basic_test!(tk_op_minus,	            r"-",	Id::Minus,	            Tag::None);
    basic_test!(tk_op_star,	                r"*",	Id::Star,	            Tag::None);
    basic_test!(tk_op_slash,	            r"/",	Id::Slash,	            Tag::None);
    basic_test!(tk_op_pipe,	                r"|",	Id::Pipe,	            Tag::None);
    basic_test!(tk_op_amp,	                r"&",	Id::Amp,	            Tag::None);
    basic_test!(tk_op_leftangle,	        r"<",	Id::LeftAngle,	        Tag::None);
    basic_test!(tk_op_rightangle,	        r">",	Id::RightAngle,	        Tag::None);
    basic_test!(tk_op_equal,	            r"=",	Id::Equal,	            Tag::None);
    basic_test!(tk_op_percent,	            r"%",	Id::Percent,	        Tag::None);
    basic_test!(tk_op_caret,	            r"^",	Id::Caret,	            Tag::None);
    basic_test!(tk_op_tilde,	            r"~",	Id::Tilde,	            Tag::None);
    basic_test!(tk_op_at,	                r"@",	Id::At,	                Tag::None);
    basic_test!(tk_op_dot,	                r".",	Id::Dot,	            Tag::None);


    // Keywords
    basic_test!(keyword_false,          "False",    Id::False,      Tag::None);
    basic_test!(keyword_none,           "None",     Id::None,       Tag::None);
    basic_test!(keyword_true,           "True",     Id::True,       Tag::None);
    basic_test!(keyword_and,            "and",      Id::And,        Tag::None);
    basic_test!(keyword_as,             "as",       Id::As,         Tag::None);
    basic_test!(keyword_assert,         "assert",   Id::Assert,     Tag::None);
    basic_test!(keyword_async,          "async",    Id::Assert,     Tag::None);
    basic_test!(keyword_break,          "break",    Id::Break,      Tag::None);
    basic_test!(keyword_class,          "class",    Id::Class,      Tag::None);
    basic_test!(keyword_continue,       "continue", Id::Continue,   Tag::None);
    basic_test!(keyword_def,            "def",      Id::Def,        Tag::None);
    basic_test!(keyword_del,            "del",      Id::Del,        Tag::None);
    basic_test!(keyword_elif,           "elif",     Id::Elif,       Tag::None);
    basic_test!(keyword_else,           "else",     Id::Else,       Tag::None);
    basic_test!(keyword_except,         "except",   Id::Except,     Tag::None);
    basic_test!(keyword_finally,        "finally",  Id::Finally,    Tag::None);
    basic_test!(keyword_for,            "for",      Id::For,        Tag::None);
    basic_test!(keyword_from,           "from",     Id::From,       Tag::None);
    basic_test!(keyword_global,         "global",   Id::Global,     Tag::None);
    basic_test!(keyword_if,             "if",       Id::If,         Tag::None);
    basic_test!(keyword_import,         "import",   Id::Import,     Tag::None);
    basic_test!(keyword_in,             "in",       Id::In,         Tag::None);
    basic_test!(keyword_is,             "is",       Id::Is,         Tag::None);
    basic_test!(keyword_lambda,         "lambda",   Id::Lambda,     Tag::None);
    basic_test!(keyword_nonlocal,       "nonlocal", Id::Nonlocal,   Tag::None);
    basic_test!(keyword_not,            "not",      Id::Not,        Tag::None);
    basic_test!(keyword_or,             "or",       Id::Or,         Tag::None);
    basic_test!(keyword_pass,           "pass",     Id::Pass,       Tag::None);
    basic_test!(keyword_raise,          "raise",    Id::Raise,      Tag::None);
    basic_test!(keyword_return,         "return",   Id::Return,     Tag::None);
    basic_test!(keyword_try,            "try",      Id::Try,        Tag::None);
    basic_test!(keyword_while,          "while",    Id::While,      Tag::None);
    basic_test!(keyword_with,           "with",     Id::With,       Tag::None);
    basic_test!(keyword_yield,          "yield",    Id::Yield,      Tag::None);


    #[test]
    fn tk_string() {

        // just "abc"
        let value = tokenize_bytes(r#"  "abc"  "#.trim().as_bytes()).unwrap();
        assert_token(&value, Id::String, Tag::None);

        // Double quoted strings containing single quotes are ok
        let value = tokenize_bytes(r#"  "Dillon's String!"  "#.trim().as_bytes()).unwrap();
        assert_token(&value, Id::String, Tag::None);

        // Single quoted strings containing double quotes are ok
        let value = tokenize_bytes(r#"  'Thing"s and stuff'   "#.trim().as_bytes()).unwrap();
        assert_token(&value, Id::String, Tag::None);

        // Triple double quoted multiline
        let value = tokenize_bytes(
r#"  """Line 0
Line 1
Line 2
Line 3
Line 4"""
"#.trim().as_bytes()).unwrap();
        assert_token(&value, Id::String, Tag::None);

        // Triple double quoted multiline
        let value = tokenize_bytes(
            r#"  '''alpha
beta
delta
gamma'''
"#.trim().as_bytes()).unwrap();
        assert_token(&value, Id::String, Tag::None);

        // Quoted keywords should still be strings
        let value = tokenize_bytes(r#"  'def'  "#.trim().as_bytes()).unwrap();
        assert_token(&value, Id::String, Tag::None);

        // Unicode
        let value = tokenize_bytes(r#"  "שּׂθשּׂઊ" "#.trim().as_bytes()).unwrap();
        assert_token(&value, Id::String, Tag::None);

        let value = tokenize_bytes(r#"  r'things'  "#.trim().as_bytes()).unwrap();
        assert_token(&value, Id::RawString, Tag::None);

        let value = tokenize_bytes(r#"  b'\x94\x54'  "#.trim().as_bytes()).unwrap();
        assert_token(&value, Id::ByteString, Tag::None);

        let value = tokenize_bytes(r#"  f'{number}'  "#.trim().as_bytes()).unwrap();
        assert_token(&value, Id::FormatString, Tag::None);

        let value = tokenize_bytes(
            r#"  # Never compromise, even in the face of armageddon "#.trim().as_bytes()).unwrap();
        assert_token(&value, Id::Comment, Tag::None);
    }


    #[test]
    fn tk_name() {
        let value = tokenize_bytes(r#" _hello "#.trim().as_bytes()).unwrap();
        assert_token(&value, Id::Name, Tag::Ident);
    }

   #[test]
    fn expr_x_eq_1() {
        let value = tokenize_bytes(r#"x = 1"#.as_bytes()).unwrap();
        println!("{}", fmt::tokens(&value.1, true));
    }

    #[test]
    fn module() {
        let input = [r#"x += 24354353
  y = 3
  Q -> c
  x = [1, 2, 3, 4, 5];
  \t
  global KLINGON
  \
θθθ
θclass Potato(Mike):
    def __init__(self):
        self.thing = 4
        self.more_things = 5

    # this is a comment
    def is_couch(self):
        return 'duh'
x += 24354353
  y = 3
  Q -> c
  x = [1, 2, 3, 4, 5];
  global KLINGON
  \
  "#.as_bytes(), "\t".as_bytes()].join(&(' ' as u8)).into_boxed_slice();

        let value = tokenize_bytes(&(*input)).unwrap();
        println!("{}", fmt::tokens(&value.1, true));

        let json = fmt::json(&value.1);
        println!("input size: {}", input.len());
        println!("json size: {}", json.len());
    }




}