aboutsummaryrefslogblamecommitdiffstats
path: root/CodeFragment.cpp
blob: 07d17fbef737b559513f9f91663439617ee1eab6 (plain) (tree)




















                                                                             



                                                 

                                   
                          
                   





                                 










                                                                          






















                                                                                                                      
                                






                                                                                                                      

                                                            
                                          
                                                          
                                          
                                                          
                                            
                                                            





                                                                                                                                              

                                                                                                        
                         
                                                             










                                                     
                                      





                       

                                                                             
                                        






























                                                                                                                                      


                                            


                         





























                                                                                                                                     






                                                                      
                                                                                      




                                                                 











                                                                                                           
                 








                                                                        





                                                                 
                                            













                                                                                                                                                     
                                                                                                               










                                                                                                                                                             
                                                                                                     


                                                 



                                                                           
                                                                    
                                                                                     
                                                                    
                                                                                     
















                                                                  
                                                                     
































                                                                                                                                             
                                                        
                                                        


                                                            













                                                                                                                                                                                                                                                                                                                                                                                                                                                                             
                                     











                                                                                                                 
                                                                                                                            
 
                                                               
                 
                                                                                 







                                                                    
                                                       

                                                             
                                                                     







                                                            
                                                                  





                                                              

                                                                   







                                                              
                                                                   

                                                                  
                                                         






                                                    


                                                       
                                              
                                                               





                                                   

                                                       




                                             
                                                                                           



                                                       
                                                            

                                                      


                                                            
                                          




                                                        

                                                    
                                         



                                                               

                                                       
                                          




                                             







                                                       




                                             









                                                       
                 




                                             
                                                         


                                                       
                                                         





                                                           





                                             
                                                                                 
                                                        


                                                     



                                                               
                                                                
                         
                                              

                                                            






                                                                  
                                                  

                                            
                                                                         


                                                                          
                                                                           
                                                       

                                                                               
                                 
                                                               


                                                    
                                                           

                                      
                                          




                                             





                                                       





                                                       
                                                                 
                                    
                                                              



                                                 

                                                      

                                                                                                                                              
                                                          



                                                  










                                                                         
/*
    This file is part of cpp-ethereum.

    cpp-ethereum is free software: you can redistribute it and/or modify
    it under the terms of the GNU General Public License as published by
    the Free Software Foundation, either version 3 of the License, or
    (at your option) any later version.

    cpp-ethereum is distributed in the hope that it will be useful,
    but WITHOUT ANY WARRANTY; without even the implied warranty of
    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
    GNU General Public License for more details.

    You should have received a copy of the GNU General Public License
    along with cpp-ethereum.  If not, see <http://www.gnu.org/licenses/>.
*/
/** @file CodeFragment.cpp
 * @author Gav Wood <i@gavwood.com>
 * @date 2014
 */

#include "CodeFragment.h"

#include <boost/algorithm/string.hpp>
#include <boost/spirit/include/support_utree.hpp>
#include <libethential/Log.h>
#include <libevmface/Instruction.h>
#include "CompilerState.h"
#include "Parser.h"
using namespace std;
using namespace eth;
namespace qi = boost::spirit::qi;
namespace px = boost::phoenix;
namespace sp = boost::spirit;

void CodeFragment::finalise(CompilerState const& _cs)
{
    if (_cs.usedAlloc && _cs.vars.size() && !m_finalised)
    {
        m_finalised = true;
        m_asm.injectStart(Instruction::MSTORE8);
        m_asm.injectStart((u256)((_cs.vars.size() + 2) * 32) - 1);
        m_asm.injectStart((u256)1);
    }
}

CodeFragment::CodeFragment(sp::utree const& _t, CompilerState& _s, bool _allowASM)
{
/*  cdebug << "CodeFragment. Locals:";
    for (auto const& i: _s.defs)
        cdebug << i.first << ":" << toHex(i.second.m_code);
    cdebug << "Args:";
    for (auto const& i: _s.args)
        cdebug << i.first << ":" << toHex(i.second.m_code);
    cdebug << "Outers:";
    for (auto const& i: _s.outers)
        cdebug << i.first << ":" << toHex(i.second.m_code);
    debugOutAST(cout, _t);
    cout << endl << flush;
*/
    switch (_t.which())
    {
    case sp::utree_type::list_type:
        constructOperation(_t, _s);
        break;
    case sp::utree_type::string_type:
    {
        auto sr = _t.get<sp::basic_string<boost::iterator_range<char const*>, sp::utree_type::string_type>>();
        string s(sr.begin(), sr.end());
        m_asm.append(s);
        break;
    }
    case sp::utree_type::symbol_type:
    {
        auto sr = _t.get<sp::basic_string<boost::iterator_range<char const*>, sp::utree_type::symbol_type>>();
        string s(sr.begin(), sr.end());
        string us = boost::algorithm::to_upper_copy(s);
        if (_allowASM && c_instructions.count(us))
            m_asm.append(c_instructions.at(us));
        else if (_s.defs.count(s))
            m_asm.append(_s.defs.at(s).m_asm);
        else if (_s.args.count(s))
            m_asm.append(_s.args.at(s).m_asm);
        else if (_s.outers.count(s))
            m_asm.append(_s.outers.at(s).m_asm);
        else if (us.find_first_of("1234567890") != 0 && us.find_first_not_of("QWERTYUIOPASDFGHJKLZXCVBNM1234567890_") == string::npos)
        {
            auto it = _s.vars.find(s);
            if (it == _s.vars.end())
            {
                bool ok;
                tie(it, ok) = _s.vars.insert(make_pair(s, make_pair(_s.stackSize, 32)));
                _s.stackSize += 32;
            }
            m_asm.append((u256)it->second.first);
        }
        else
            error<BareSymbol>();

        break;
    }
    case sp::utree_type::any_type:
    {
        bigint i = *_t.get<bigint*>();
        if (i < 0 || i > bigint(u256(0) - 1))
            error<IntegerOutOfRange>();
        m_asm.append((u256)i);
        break;
    }
    default: break;
    }
}

void CodeFragment::constructOperation(sp::utree const& _t, CompilerState& _s)
{
    if (_t.tag() == 0 && _t.empty())
        error<EmptyList>();
    else if (_t.tag() == 0 && _t.front().which() != sp::utree_type::symbol_type)
        error<DataNotExecutable>();
    else
    {
        string s;
        string us;
        switch (_t.tag())
        {
        case 0:
        {
            auto sr = _t.front().get<sp::basic_string<boost::iterator_range<char const*>, sp::utree_type::symbol_type>>();
            s = string(sr.begin(), sr.end());
            us = boost::algorithm::to_upper_copy(s);
            break;
        }
        case 1:
            us = "MLOAD";
            break;
        case 2:
            us = "SLOAD";
            break;
        case 3:
            us = "MSTORE";
            break;
        case 4:
            us = "SSTORE";
            break;
        case 5:
            us = "SEQ";
            break;
        case 6:
            us = "CALLDATALOAD";
            break;
        default:;
        }

        auto firstAsString = [&]()
        {
            auto i = *++_t.begin();
            if (i.tag())
                error<InvalidName>();
            if (i.which() == sp::utree_type::string_type)
            {
                auto sr = i.get<sp::basic_string<boost::iterator_range<char const*>, sp::utree_type::string_type>>();
                return string(sr.begin(), sr.end());
            }
            else if (i.which() == sp::utree_type::symbol_type)
            {
                auto sr = i.get<sp::basic_string<boost::iterator_range<char const*>, sp::utree_type::symbol_type>>();
                return _s.getDef(string(sr.begin(), sr.end())).m_asm.backString();
            }
            return string();
        };

        auto varAddress = [&](string const& n)
        {
            auto it = _s.vars.find(n);
            if (it == _s.vars.end())
            {
                bool ok;
                tie(it, ok) = _s.vars.insert(make_pair(n, make_pair(_s.stackSize, 32)));
                _s.stackSize += 32;
            }
            return it->second.first;
        };

        // Operations who args are not standard stack-pushers.
        bool nonStandard = true;
        if (us == "ASM")
        {
            int c = 0;
            for (auto const& i: _t)
                if (c++)
                    m_asm.append(CodeFragment(i, _s, true).m_asm);
        }
        else if (us == "INCLUDE")
        {
            if (_t.size() != 2)
                error<IncorrectParameterCount>();
            m_asm.append(CodeFragment::compile(asString(contents(firstAsString())), _s).m_asm);
        }
        else if (us == "SET")
        {
            if (_t.size() != 3)
                error<IncorrectParameterCount>();
            int c = 0;
            for (auto const& i: _t)
                if (c++ == 2)
                    m_asm.append(CodeFragment(i, _s, false).m_asm);
            m_asm.append((u256)varAddress(firstAsString()));
            m_asm.append(Instruction::MSTORE);
        }
        else if (us == "GET")
        {
            if (_t.size() != 2)
                error<IncorrectParameterCount>();
            m_asm.append((u256)varAddress(firstAsString()));
            m_asm.append(Instruction::MLOAD);
        }
        else if (us == "REF")
            m_asm.append((u256)varAddress(firstAsString()));
        else if (us == "DEF")
        {
            string n;
            unsigned ii = 0;
            if (_t.size() != 3 && _t.size() != 4)
                error<IncorrectParameterCount>();
            vector<string> args;
            for (auto const& i: _t)
            {
                if (ii == 1)
                {
                    if (i.tag())
                        error<InvalidName>();
                    if (i.which() == sp::utree_type::string_type)
                    {
                        auto sr = i.get<sp::basic_string<boost::iterator_range<char const*>, sp::utree_type::string_type>>();
                        n = string(sr.begin(), sr.end());
                    }
                    else if (i.which() == sp::utree_type::symbol_type)
                    {
                        auto sr = i.get<sp::basic_string<boost::iterator_range<char const*>, sp::utree_type::symbol_type>>();
                        n = _s.getDef(string(sr.begin(), sr.end())).m_asm.backString();
                    }
                }
                else if (ii == 2)
                    if (_t.size() == 3)
                        _s.defs[n] = CodeFragment(i, _s);
                    else
                        for (auto const& j: i)
                        {
                            if (j.tag() || j.which() != sp::utree_type::symbol_type)
                                error<InvalidMacroArgs>();
                            auto sr = j.get<sp::basic_string<boost::iterator_range<char const*>, sp::utree_type::symbol_type>>();
                            args.push_back(string(sr.begin(), sr.end()));
                        }
                else if (ii == 3)
                {
                    auto k = make_pair(n, args.size());
                    _s.macros[k].code = i;
                    _s.macros[k].env = _s.outers;
                    _s.macros[k].args = args;
                    for (auto const& i: _s.args)
                        _s.macros[k].env[i.first] = i.second;
                    for (auto const& i: _s.defs)
                        _s.macros[k].env[i.first] = i.second;
                }
                ++ii;
            }

        }
        else if (us == "LIT")
        {
            if (_t.size() < 3)
                error<IncorrectParameterCount>();
            unsigned ii = 0;
            CodeFragment pos;
            bytes data;
            for (auto const& i: _t)
            {
                if (ii == 1)
                {
                    pos = CodeFragment(i, _s);
                    if (pos.m_asm.deposit() != 1)
                        error<InvalidDeposit>();
                }
                else if (ii == 2 && !i.tag() && i.which() == sp::utree_type::string_type)
                {
                    auto sr = i.get<sp::basic_string<boost::iterator_range<char const*>, sp::utree_type::string_type>>();
                    data = bytes((byte const*)sr.begin(), (byte const*)sr.end());
                }
                else if (ii >= 2 && !i.tag() && i.which() == sp::utree_type::any_type)
                {
                    bigint bi = *i.get<bigint*>();
                    if (bi < 0)
                        error<IntegerOutOfRange>();
                    else if (bi > bigint(u256(0) - 1))
                    {
                        if (ii == 2 && _t.size() == 3)
                        {
                            // One big int - allow it as hex.
                            data.resize(bytesRequired(bi));
                            toBigEndian(bi, data);
                        }
                        else
                            error<IntegerOutOfRange>();
                    }
                    else
                    {
                        data.resize(data.size() + 32);
                        *(h256*)(&data.back() - 31) = (u256)bi;
                    }
                }
                else if (ii)
                    error<InvalidLiteral>();
                ++ii;
            }
            m_asm.append((u256)data.size());
            m_asm.append(Instruction::DUP1);
            m_asm.append(data);
            m_asm.append(pos.m_asm, 1);
            m_asm.append(Instruction::CODECOPY);
        }
        else
            nonStandard = false;

        if (nonStandard)
            return;

        std::map<std::string, Instruction> const c_arith = { { "+", Instruction::ADD }, { "-", Instruction::SUB }, { "*", Instruction::MUL }, { "/", Instruction::DIV }, { "%", Instruction::MOD }, { "&", Instruction::AND }, { "|", Instruction::OR }, { "^", Instruction::XOR } };
        std::map<std::string, pair<Instruction, bool>> const c_binary = { { "<", { Instruction::LT, false } }, { "<=", { Instruction::GT, true } }, { ">", { Instruction::GT, false } }, { ">=", { Instruction::LT, true } }, { "S<", { Instruction::SLT, false } }, { "S<=", { Instruction::SGT, true } }, { "S>", { Instruction::SGT, false } }, { "S>=", { Instruction::SLT, true } }, { "=", { Instruction::EQ, false } }, { "!=", { Instruction::EQ, true } } };
        std::map<std::string, Instruction> const c_unary = { { "!", Instruction::NOT } };

        vector<CodeFragment> code;
        CompilerState ns = _s;
        ns.vars.clear();
        ns.usedAlloc = false;
        int c = _t.tag() ? 1 : 0;
        for (auto const& i: _t)
            if (c++)
            {
                if (us == "LLL" && c == 1)
                    code.push_back(CodeFragment(i, ns));
                else
                    code.push_back(CodeFragment(i, _s));
            }
        auto requireSize = [&](unsigned s) { if (code.size() != s) error<IncorrectParameterCount>(); };
        auto requireMinSize = [&](unsigned s) { if (code.size() < s) error<IncorrectParameterCount>(); };
        auto requireMaxSize = [&](unsigned s) { if (code.size() > s) error<IncorrectParameterCount>(); };
        auto requireDeposit = [&](unsigned i, int s) { if (code[i].m_asm.deposit() != s) error<InvalidDeposit>(); };

        if (_s.macros.count(make_pair(s, code.size())))
        {
            Macro const& m = _s.macros.at(make_pair(s, code.size()));
            CompilerState cs = _s;
            for (auto const& i: m.env)
                cs.outers[i.first] = i.second;
            for (auto const& i: cs.defs)
                cs.outers[i.first] = i.second;
            cs.defs.clear();
            for (unsigned i = 0; i < m.args.size(); ++i)
            {
                //requireDeposit(i, 1);
                cs.args[m.args[i]] = code[i];
            }
            m_asm.append(CodeFragment(m.code, cs).m_asm);
            for (auto const& i: cs.defs)
                _s.defs[i.first] = i.second;
            for (auto const& i: cs.macros)
                _s.macros.insert(i);
        }
        else if (c_instructions.count(us))
        {
            auto it = c_instructions.find(us);
            int ea = instructionInfo(it->second).args;
            if (ea >= 0)
                requireSize(ea);
            else
                requireMinSize(-ea);

            for (unsigned i = code.size(); i; --i)
                m_asm.append(code[i - 1].m_asm, 1);
            m_asm.append(it->second);
        }
        else if (c_arith.count(us))
        {
            auto it = c_arith.find(us);
            requireMinSize(1);
            for (unsigned i = code.size(); i; --i)
            {
                requireDeposit(i - 1, 1);
                m_asm.append(code[i - 1].m_asm, 1);
            }
            for (unsigned i = 1; i < code.size(); ++i)
                m_asm.append(it->second);
        }
        else if (c_binary.count(us))
        {
            auto it = c_binary.find(us);
            requireSize(2);
            requireDeposit(0, 1);
            requireDeposit(1, 1);
            m_asm.append(code[1].m_asm, 1);
            m_asm.append(code[0].m_asm, 1);
            m_asm.append(it->second.first);
            if (it->second.second)
                m_asm.append(Instruction::NOT);
        }
        else if (c_unary.count(us))
        {
            auto it = c_unary.find(us);
            requireSize(1);
            requireDeposit(0, 1);
            m_asm.append(code[0].m_asm, 1);
            m_asm.append(it->second);
        }
        else if (us == "IF")
        {
            requireSize(3);
            requireDeposit(0, 1);
            int minDep = min(code[1].m_asm.deposit(), code[2].m_asm.deposit());

            m_asm.append(code[0].m_asm);
            auto pos = m_asm.appendJumpI();
            m_asm.onePath();
            m_asm.append(code[2].m_asm, minDep);
            auto end = m_asm.appendJump();
            m_asm.otherPath();
            m_asm << pos.tag();
            m_asm.append(code[1].m_asm, minDep);
            m_asm << end.tag();
            m_asm.donePaths();
        }
        else if (us == "WHEN" || us == "UNLESS")
        {
            requireSize(2);
            requireDeposit(0, 1);

            m_asm.append(code[0].m_asm);
            if (us == "WHEN")
                m_asm.append(Instruction::NOT);
            auto end = m_asm.appendJumpI();
            m_asm.onePath();
            m_asm.otherPath();
            m_asm.append(code[1].m_asm, 0);
            m_asm << end.tag();
            m_asm.donePaths();
        }
        else if (us == "WHILE")
        {
            requireSize(2);
            requireDeposit(0, 1);

            auto begin = m_asm.append();
            m_asm.append(code[0].m_asm);
            m_asm.append(Instruction::NOT);
            auto end = m_asm.appendJumpI();
            m_asm.append(code[1].m_asm, 0);
            m_asm.appendJump(begin);
            m_asm << end.tag();
        }
        else if (us == "FOR")
        {
            requireSize(4);
            requireDeposit(1, 1);

            m_asm.append(code[0].m_asm, 0);
            auto begin = m_asm.append();
            m_asm.append(code[1].m_asm);
            m_asm.append(Instruction::NOT);
            auto end = m_asm.appendJumpI();
            m_asm.append(code[3].m_asm, 0);
            m_asm.append(code[2].m_asm, 0);
            m_asm.appendJump(begin);
            m_asm << end.tag();
        }
        else if (us == "ALLOC")
        {
            requireSize(1);
            requireDeposit(0, 1);

            m_asm.append(Instruction::MSIZE);
            m_asm.append(u256(0));
            m_asm.append(u256(1));
            m_asm.append(code[0].m_asm, 1);
            m_asm.append(Instruction::MSIZE);
            m_asm.append(Instruction::ADD);
            m_asm.append(Instruction::SUB);
            m_asm.append(Instruction::MSTORE8);

            _s.usedAlloc = true;
        }
        else if (us == "LLL")
        {
            requireMinSize(2);
            requireMaxSize(3);
            requireDeposit(1, 1);

            auto subPush = m_asm.appendSubSize(code[0].assembly(ns));
            m_asm.append(Instruction::DUP1);
            if (code.size() == 3)
            {
                requireDeposit(2, 1);
                m_asm.append(code[2].m_asm, 1);
                m_asm.append(Instruction::LT);
                m_asm.append(Instruction::NOT);
                m_asm.append(Instruction::MUL);
                m_asm.append(Instruction::DUP1);
            }
            m_asm.append(subPush);
            m_asm.append(code[1].m_asm, 1);
            m_asm.append(Instruction::CODECOPY);
        }
        else if (us == "&&" || us == "||")
        {
            requireMinSize(1);
            for (unsigned i = 0; i < code.size(); ++i)
                requireDeposit(i, 1);

            auto end = m_asm.newTag();
            if (code.size() > 1)
            {
                m_asm.append((u256)(us == "||" ? 1 : 0));
                for (unsigned i = 1; i < code.size(); ++i)
                {
                    // Check if true - predicate
                    m_asm.append(code[i - 1].m_asm, 1);
                    if (us == "&&")
                        m_asm.append(Instruction::NOT);
                    m_asm.appendJumpI(end);
                }
                m_asm.append(Instruction::POP);
            }

            // Check if true - predicate
            m_asm.append(code.back().m_asm, 1);

            // At end now.
            m_asm.append(end);
        }
        else if (us == "~")
        {
            requireSize(1);
            requireDeposit(0, 1);

            m_asm.append(code[0].m_asm, 1);
            m_asm.append((u256)1);
            m_asm.append((u256)0);
            m_asm.append(Instruction::SUB);
            m_asm.append(Instruction::SUB);
        }
        else if (us == "SEQ")
        {
            unsigned ii = 0;
            for (auto const& i: code)
                if (++ii < code.size())
                    m_asm.append(i.m_asm, 0);
                else
                    m_asm.append(i.m_asm);
        }
        else if (us == "RAW")
        {
            for (auto const& i: code)
                m_asm.append(i.m_asm);
            m_asm.popTo(1);
        }
        else if (us.find_first_of("1234567890") != 0 && us.find_first_not_of("QWERTYUIOPASDFGHJKLZXCVBNM1234567890_") == string::npos)
            m_asm.append((u256)varAddress(s));
        else
            error<InvalidOperation>();
    }
}

CodeFragment CodeFragment::compile(string const& _src, CompilerState& _s)
{
    CodeFragment ret;
    sp::utree o;
    parseTreeLLL(_src, o);
    if (!o.empty())
        ret = CodeFragment(o, _s);
    _s.treesToKill.push_back(o);
    return ret;
}