// pocketpy.h
  1. #pragma once
  2. #include "vm.h"
  3. #include "compiler.h"
  4. #include "repl.h"
  5. _Code VM::compile(_Str source, _Str filename, CompileMode mode) {
  6. Compiler compiler(this, source.c_str(), filename, mode);
  7. try{
  8. return compiler.__fillCode();
  9. }catch(_Error& e){
  10. throw e;
  11. }catch(std::exception& e){
  12. throw CompileError("UnexpectedError", e.what(), compiler.getLineSnapshot());
  13. }
  14. }
  // Binds the binary operator `op` as method `name` on both "int" and "float".
  // When both operands are ints the result is an int; every other combination
  // is evaluated after converting both operands with num_to_float.
  #define BIND_NUM_ARITH_OPT(name, op)                                                            \
      _vm->bindMethodMulti<1>({"int","float"}, #name, [](VM* vm, const pkpy::ArgList& args){      \
          const bool both_int = args[0]->is_type(vm->_tp_int) && args[1]->is_type(vm->_tp_int);   \
          if(!both_int){                                                                          \
              return vm->PyFloat(vm->num_to_float(args[0]) op vm->num_to_float(args[1]));         \
          }                                                                                       \
          return vm->PyInt(vm->PyInt_AS_C(args[0]) op vm->PyInt_AS_C(args[1]));                   \
      });
  // Binds the comparison operator `op` as method `name` on both "int" and "float".
  //
  // If the operands are not both numeric: with `is_eq` the result is the
  // identity comparison of the two objects, otherwise a type error is raised.
  // Two ints are compared as integers (converting them to float first would
  // make distinct 64-bit values above 2^53 compare equal); every other numeric
  // combination is compared after num_to_float.
  #define BIND_NUM_LOGICAL_OPT(name, op, is_eq) \
      _vm->bindMethodMulti<1>({"int","float"}, #name, [](VM* vm, const pkpy::ArgList& args){ \
          if(!vm->is_int_or_float(args[0], args[1])){ \
              if constexpr(is_eq) return vm->PyBool(args[0] == args[1]); \
              vm->typeError("unsupported operand type(s) for " #op ); \
          } \
          if(args[0]->is_type(vm->_tp_int) && args[1]->is_type(vm->_tp_int)){ \
              return vm->PyBool(vm->PyInt_AS_C(args[0]) op vm->PyInt_AS_C(args[1])); \
          } \
          return vm->PyBool(vm->num_to_float(args[0]) op vm->num_to_float(args[1])); \
      });
  31. void __initializeBuiltinFunctions(VM* _vm) {
  32. BIND_NUM_ARITH_OPT(__add__, +)
  33. BIND_NUM_ARITH_OPT(__sub__, -)
  34. BIND_NUM_ARITH_OPT(__mul__, *)
  35. BIND_NUM_LOGICAL_OPT(__lt__, <, false)
  36. BIND_NUM_LOGICAL_OPT(__le__, <=, false)
  37. BIND_NUM_LOGICAL_OPT(__gt__, >, false)
  38. BIND_NUM_LOGICAL_OPT(__ge__, >=, false)
  39. BIND_NUM_LOGICAL_OPT(__eq__, ==, true)
  40. #undef BIND_NUM_ARITH_OPT
  41. #undef BIND_NUM_LOGICAL_OPT
  42. _vm->bindBuiltinFunc<1>("__sys_stdout_write", [](VM* vm, const pkpy::ArgList& args) {
  43. (*vm->_stdout) << vm->PyStr_AS_C(args[0]);
  44. return vm->None;
  45. });
  46. _vm->bindBuiltinFunc<0>("super", [](VM* vm, const pkpy::ArgList& args) {
  47. auto it = vm->top_frame()->f_locals.find(m_self);
  48. if(it == vm->top_frame()->f_locals.end()) vm->typeError("super() can only be called in a class method");
  49. return vm->new_object(vm->_tp_super, it->second);
  50. });
  51. _vm->bindBuiltinFunc<1>("eval", [](VM* vm, const pkpy::ArgList& args) {
  52. const _Str& expr = vm->PyStr_AS_C(args[0]);
  53. _Code code = vm->compile(expr, "<eval>", EVAL_MODE);
  54. return vm->_exec(code, vm->top_frame()->_module, vm->top_frame()->f_locals_copy());
  55. });
  56. _vm->bindBuiltinFunc<1>("repr", CPP_LAMBDA(vm->asRepr(args[0])));
  57. _vm->bindBuiltinFunc<1>("hash", CPP_LAMBDA(vm->PyInt(vm->hash(args[0]))));
  58. _vm->bindBuiltinFunc<1>("len", CPP_LAMBDA(vm->call(args[0], __len__, pkpy::noArg())));
  59. _vm->bindBuiltinFunc<1>("chr", [](VM* vm, const pkpy::ArgList& args) {
  60. i64 i = vm->PyInt_AS_C(args[0]);
  61. if (i < 0 || i > 128) vm->valueError("chr() arg not in range(128)");
  62. return vm->PyStr(std::string(1, (char)i));
  63. });
  64. _vm->bindBuiltinFunc<1>("ord", [](VM* vm, const pkpy::ArgList& args) {
  65. _Str s = vm->PyStr_AS_C(args[0]);
  66. if (s.size() != 1) vm->typeError("ord() expected an ASCII character");
  67. return vm->PyInt((i64)s[0]);
  68. });
  69. _vm->bindBuiltinFunc<0>("globals", [](VM* vm, const pkpy::ArgList& args) {
  70. const auto& d = vm->top_frame()->f_globals();
  71. PyVar obj = vm->call(vm->builtins->attribs["dict"]);
  72. for (const auto& [k, v] : d) {
  73. vm->call(obj, __setitem__, pkpy::twoArgs(vm->PyStr(k), v));
  74. }
  75. return obj;
  76. });
  77. _vm->bindBuiltinFunc<0>("locals", [](VM* vm, const pkpy::ArgList& args) {
  78. const auto& d = vm->top_frame()->f_locals;
  79. PyVar obj = vm->call(vm->builtins->attribs["dict"]);
  80. for (const auto& [k, v] : d) {
  81. vm->call(obj, __setitem__, pkpy::twoArgs(vm->PyStr(k), v));
  82. }
  83. return obj;
  84. });
  85. _vm->bindBuiltinFunc<1>("hex", [](VM* vm, const pkpy::ArgList& args) {
  86. std::stringstream ss;
  87. ss << std::hex << vm->PyInt_AS_C(args[0]);
  88. return vm->PyStr("0x" + ss.str());
  89. });
  90. _vm->bindBuiltinFunc<1>("dir", [](VM* vm, const pkpy::ArgList& args) {
  91. std::vector<_Str> names;
  92. for (auto& [k, _] : args[0]->attribs) names.push_back(k);
  93. for (auto& [k, _] : args[0]->_type->attribs) {
  94. if (k.find("__") == 0) continue;
  95. if (std::find(names.begin(), names.end(), k) == names.end()) names.push_back(k);
  96. }
  97. PyVarList ret;
  98. for (const auto& name : names) ret.push_back(vm->PyStr(name));
  99. std::sort(ret.begin(), ret.end(), [vm](const PyVar& a, const PyVar& b) {
  100. return vm->PyStr_AS_C(a) < vm->PyStr_AS_C(b);
  101. });
  102. return vm->PyList(ret);
  103. });
  104. _vm->bindMethod<0>("object", "__repr__", [](VM* vm, const pkpy::ArgList& args) {
  105. PyVar _self = args[0];
  106. std::stringstream ss;
  107. ss << std::hex << (uintptr_t)_self.get();
  108. _Str s = "<" + UNION_TP_NAME(_self) + " object at 0x" + ss.str() + ">";
  109. return vm->PyStr(s);
  110. });
  111. _vm->bindMethod<1>("object", "__eq__", CPP_LAMBDA(vm->PyBool(args[0] == args[1])));
  112. _vm->bindStaticMethod<1>("type", "__new__", CPP_LAMBDA(args[0]->_type));
  113. _vm->bindStaticMethod<-1>("range", "__new__", [](VM* vm, const pkpy::ArgList& args) {
  114. _Range r;
  115. switch (args.size()) {
  116. case 1: r.stop = vm->PyInt_AS_C(args[0]); break;
  117. case 2: r.start = vm->PyInt_AS_C(args[0]); r.stop = vm->PyInt_AS_C(args[1]); break;
  118. case 3: r.start = vm->PyInt_AS_C(args[0]); r.stop = vm->PyInt_AS_C(args[1]); r.step = vm->PyInt_AS_C(args[2]); break;
  119. default: vm->typeError("expected 1-3 arguments, but got " + std::to_string(args.size()));
  120. }
  121. return vm->PyRange(r);
  122. });
  123. _vm->bindMethod<0>("range", "__iter__", CPP_LAMBDA(
  124. vm->PyIter(pkpy::make_shared<BaseIterator, RangeIterator>(vm, args[0]))
  125. ));
  126. _vm->bindMethod<0>("NoneType", "__repr__", CPP_LAMBDA(vm->PyStr("None")));
  127. _vm->bindMethod<0>("NoneType", "__json__", CPP_LAMBDA(vm->PyStr("null")));
  128. _vm->bindMethodMulti<1>({"int", "float"}, "__truediv__", [](VM* vm, const pkpy::ArgList& args) {
  129. f64 rhs = vm->num_to_float(args[1]);
  130. if (rhs == 0) vm->zeroDivisionError();
  131. return vm->PyFloat(vm->num_to_float(args[0]) / rhs);
  132. });
  133. _vm->bindMethodMulti<1>({"int", "float"}, "__pow__", [](VM* vm, const pkpy::ArgList& args) {
  134. if(args[0]->is_type(vm->_tp_int) && args[1]->is_type(vm->_tp_int)){
  135. return vm->PyInt((i64)round(pow(vm->PyInt_AS_C(args[0]), vm->PyInt_AS_C(args[1]))));
  136. }else{
  137. return vm->PyFloat((f64)pow(vm->num_to_float(args[0]), vm->num_to_float(args[1])));
  138. }
  139. });
  140. /************ PyInt ************/
  141. _vm->bindStaticMethod<1>("int", "__new__", [](VM* vm, const pkpy::ArgList& args) {
  142. if (args[0]->is_type(vm->_tp_int)) return args[0];
  143. if (args[0]->is_type(vm->_tp_float)) return vm->PyInt((i64)vm->PyFloat_AS_C(args[0]));
  144. if (args[0]->is_type(vm->_tp_bool)) return vm->PyInt(vm->PyBool_AS_C(args[0]) ? 1 : 0);
  145. if (args[0]->is_type(vm->_tp_str)) {
  146. const _Str& s = vm->PyStr_AS_C(args[0]);
  147. try{
  148. size_t parsed = 0;
  149. i64 val = std::stoll(s, &parsed, 10);
  150. if(parsed != s.size()) throw std::invalid_argument("");
  151. return vm->PyInt(val);
  152. }catch(std::invalid_argument&){
  153. vm->valueError("invalid literal for int(): '" + s + "'");
  154. }
  155. }
  156. vm->typeError("int() argument must be a int, float, bool or str");
  157. return vm->None;
  158. });
  159. _vm->bindMethod<1>("int", "__floordiv__", [](VM* vm, const pkpy::ArgList& args) {
  160. i64 rhs = vm->PyInt_AS_C(args[1]);
  161. if(rhs == 0) vm->zeroDivisionError();
  162. return vm->PyInt(vm->PyInt_AS_C(args[0]) / rhs);
  163. });
  164. _vm->bindMethod<1>("int", "__mod__", [](VM* vm, const pkpy::ArgList& args) {
  165. i64 rhs = vm->PyInt_AS_C(args[1]);
  166. if(rhs == 0) vm->zeroDivisionError();
  167. return vm->PyInt(vm->PyInt_AS_C(args[0]) % rhs);
  168. });
  169. _vm->bindMethod<0>("int", "__repr__", [](VM* vm, const pkpy::ArgList& args) {
  170. return vm->PyStr(std::to_string(vm->PyInt_AS_C(args[0])));
  171. });
  172. _vm->bindMethod<0>("int", "__json__", [](VM* vm, const pkpy::ArgList& args) {
  173. return vm->PyStr(std::to_string((int)vm->PyInt_AS_C(args[0])));
  174. });
  175. #define __INT_BITWISE_OP(name,op) \
  176. _vm->bindMethod<1>("int", #name, [](VM* vm, const pkpy::ArgList& args) { \
  177. return vm->PyInt(vm->PyInt_AS_C(args[0]) op vm->PyInt_AS_C(args[1])); \
  178. });
  179. __INT_BITWISE_OP(__lshift__, <<)
  180. __INT_BITWISE_OP(__rshift__, >>)
  181. __INT_BITWISE_OP(__and__, &)
  182. __INT_BITWISE_OP(__or__, |)
  183. __INT_BITWISE_OP(__xor__, ^)
  184. #undef __INT_BITWISE_OP
  185. /************ PyFloat ************/
  186. _vm->bindStaticMethod<1>("float", "__new__", [](VM* vm, const pkpy::ArgList& args) {
  187. if (args[0]->is_type(vm->_tp_int)) return vm->PyFloat((f64)vm->PyInt_AS_C(args[0]));
  188. if (args[0]->is_type(vm->_tp_float)) return args[0];
  189. if (args[0]->is_type(vm->_tp_bool)) return vm->PyFloat(vm->PyBool_AS_C(args[0]) ? 1.0 : 0.0);
  190. if (args[0]->is_type(vm->_tp_str)) {
  191. const _Str& s = vm->PyStr_AS_C(args[0]);
  192. if(s == "inf") return vm->PyFloat(INFINITY);
  193. if(s == "-inf") return vm->PyFloat(-INFINITY);
  194. try{
  195. f64 val = std::stod(s);
  196. return vm->PyFloat(val);
  197. }catch(std::invalid_argument&){
  198. vm->valueError("invalid literal for float(): '" + s + "'");
  199. }
  200. }
  201. vm->typeError("float() argument must be a int, float, bool or str");
  202. return vm->None;
  203. });
  204. _vm->bindMethod<0>("float", "__repr__", [](VM* vm, const pkpy::ArgList& args) {
  205. f64 val = vm->PyFloat_AS_C(args[0]);
  206. if(std::isinf(val) || std::isnan(val)) return vm->PyStr(std::to_string(val));
  207. _StrStream ss;
  208. ss << std::setprecision(std::numeric_limits<f64>::max_digits10-1) << val;
  209. std::string s = ss.str();
  210. if(std::all_of(s.begin()+1, s.end(), isdigit)) s += ".0";
  211. return vm->PyStr(s);
  212. });
  213. _vm->bindMethod<0>("float", "__json__", [](VM* vm, const pkpy::ArgList& args) {
  214. f64 val = vm->PyFloat_AS_C(args[0]);
  215. if(std::isinf(val) || std::isnan(val)) vm->valueError("cannot jsonify 'nan' or 'inf'");
  216. return vm->PyStr(std::to_string(val));
  217. });
  218. /************ PyString ************/
  219. _vm->bindStaticMethod<1>("str", "__new__", CPP_LAMBDA(vm->asStr(args[0])));
  220. _vm->bindMethod<1>("str", "__add__", [](VM* vm, const pkpy::ArgList& args) {
  221. const _Str& lhs = vm->PyStr_AS_C(args[0]);
  222. const _Str& rhs = vm->PyStr_AS_C(args[1]);
  223. return vm->PyStr(lhs + rhs);
  224. });
  225. _vm->bindMethod<0>("str", "__len__", [](VM* vm, const pkpy::ArgList& args) {
  226. const _Str& _self = vm->PyStr_AS_C(args[0]);
  227. return vm->PyInt(_self.u8_length());
  228. });
  229. _vm->bindMethod<1>("str", "__contains__", [](VM* vm, const pkpy::ArgList& args) {
  230. const _Str& _self = vm->PyStr_AS_C(args[0]);
  231. const _Str& _other = vm->PyStr_AS_C(args[1]);
  232. return vm->PyBool(_self.find(_other) != _Str::npos);
  233. });
  234. _vm->bindMethod<0>("str", "__str__", CPP_LAMBDA(args[0]));
  235. _vm->bindMethod<0>("str", "__iter__", CPP_LAMBDA(
  236. vm->PyIter(pkpy::make_shared<BaseIterator, StringIterator>(vm, args[0]))
  237. ));
  238. _vm->bindMethod<0>("str", "__repr__", [](VM* vm, const pkpy::ArgList& args) {
  239. const _Str& _self = vm->PyStr_AS_C(args[0]);
  240. return vm->PyStr(_self.__escape(true));
  241. });
  242. _vm->bindMethod<0>("str", "__json__", [](VM* vm, const pkpy::ArgList& args) {
  243. const _Str& _self = vm->PyStr_AS_C(args[0]);
  244. return vm->PyStr(_self.__escape(false));
  245. });
  246. _vm->bindMethod<1>("str", "__eq__", [](VM* vm, const pkpy::ArgList& args) {
  247. if(args[0]->is_type(vm->_tp_str) && args[1]->is_type(vm->_tp_str))
  248. return vm->PyBool(vm->PyStr_AS_C(args[0]) == vm->PyStr_AS_C(args[1]));
  249. return vm->PyBool(args[0] == args[1]);
  250. });
  251. _vm->bindMethod<1>("str", "__getitem__", [](VM* vm, const pkpy::ArgList& args) {
  252. const _Str& _self (vm->PyStr_AS_C(args[0]));
  253. if(args[1]->is_type(vm->_tp_slice)){
  254. _Slice s = vm->PySlice_AS_C(args[1]);
  255. s.normalize(_self.u8_length());
  256. return vm->PyStr(_self.u8_substr(s.start, s.stop));
  257. }
  258. int _index = (int)vm->PyInt_AS_C(args[1]);
  259. _index = vm->normalizedIndex(_index, _self.u8_length());
  260. return vm->PyStr(_self.u8_getitem(_index));
  261. });
  262. _vm->bindMethod<1>("str", "__gt__", [](VM* vm, const pkpy::ArgList& args) {
  263. const _Str& _self (vm->PyStr_AS_C(args[0]));
  264. const _Str& _obj (vm->PyStr_AS_C(args[1]));
  265. return vm->PyBool(_self > _obj);
  266. });
  267. _vm->bindMethod<1>("str", "__lt__", [](VM* vm, const pkpy::ArgList& args) {
  268. const _Str& _self (vm->PyStr_AS_C(args[0]));
  269. const _Str& _obj (vm->PyStr_AS_C(args[1]));
  270. return vm->PyBool(_self < _obj);
  271. });
  272. _vm->bindMethod<2>("str", "replace", [](VM* vm, const pkpy::ArgList& args) {
  273. const _Str& _self = vm->PyStr_AS_C(args[0]);
  274. const _Str& _old = vm->PyStr_AS_C(args[1]);
  275. const _Str& _new = vm->PyStr_AS_C(args[2]);
  276. _Str _copy = _self;
  277. // replace all occurences of _old with _new in _copy
  278. size_t pos = 0;
  279. while ((pos = _copy.find(_old, pos)) != std::string::npos) {
  280. _copy.replace(pos, _old.length(), _new);
  281. pos += _new.length();
  282. }
  283. return vm->PyStr(_copy);
  284. });
  285. _vm->bindMethod<1>("str", "startswith", [](VM* vm, const pkpy::ArgList& args) {
  286. const _Str& _self = vm->PyStr_AS_C(args[0]);
  287. const _Str& _prefix = vm->PyStr_AS_C(args[1]);
  288. return vm->PyBool(_self.find(_prefix) == 0);
  289. });
  290. _vm->bindMethod<1>("str", "endswith", [](VM* vm, const pkpy::ArgList& args) {
  291. const _Str& _self = vm->PyStr_AS_C(args[0]);
  292. const _Str& _suffix = vm->PyStr_AS_C(args[1]);
  293. return vm->PyBool(_self.rfind(_suffix) == _self.length() - _suffix.length());
  294. });
  295. _vm->bindMethod<1>("str", "join", [](VM* vm, const pkpy::ArgList& args) {
  296. const _Str& _self = vm->PyStr_AS_C(args[0]);
  297. PyVarList* _list;
  298. if(args[1]->is_type(vm->_tp_list)){
  299. _list = &vm->PyList_AS_C(args[1]);
  300. }else if(args[1]->is_type(vm->_tp_tuple)){
  301. _list = &vm->PyTuple_AS_C(args[1]);
  302. }else{
  303. vm->typeError("can only join a list or tuple");
  304. }
  305. _StrStream ss;
  306. for(int i = 0; i < _list->size(); i++){
  307. if(i > 0) ss << _self;
  308. ss << vm->PyStr_AS_C(vm->asStr(_list->operator[](i)));
  309. }
  310. return vm->PyStr(ss.str());
  311. });
  312. /************ PyList ************/
  313. _vm->bindMethod<0>("list", "__iter__", [](VM* vm, const pkpy::ArgList& args) {
  314. return vm->PyIter(
  315. pkpy::make_shared<BaseIterator, VectorIterator>(vm, args[0])
  316. );
  317. });
  318. _vm->bindMethod<1>("list", "append", [](VM* vm, const pkpy::ArgList& args) {
  319. PyVarList& _self = vm->PyList_AS_C(args[0]);
  320. _self.push_back(args[1]);
  321. return vm->None;
  322. });
  323. _vm->bindMethod<2>("list", "insert", [](VM* vm, const pkpy::ArgList& args) {
  324. PyVarList& _self = vm->PyList_AS_C(args[0]);
  325. int _index = (int)vm->PyInt_AS_C(args[1]);
  326. if(_index < 0) _index += _self.size();
  327. if(_index < 0) _index = 0;
  328. if(_index > _self.size()) _index = _self.size();
  329. _self.insert(_self.begin() + _index, args[2]);
  330. return vm->None;
  331. });
  332. _vm->bindMethod<0>("list", "clear", [](VM* vm, const pkpy::ArgList& args) {
  333. vm->PyList_AS_C(args[0]).clear();
  334. return vm->None;
  335. });
  336. _vm->bindMethod<0>("list", "copy", [](VM* vm, const pkpy::ArgList& args) {
  337. return vm->PyList(vm->PyList_AS_C(args[0]));
  338. });
  339. _vm->bindMethod<1>("list", "__add__", [](VM* vm, const pkpy::ArgList& args) {
  340. const PyVarList& _self = vm->PyList_AS_C(args[0]);
  341. const PyVarList& _obj = vm->PyList_AS_C(args[1]);
  342. PyVarList _new_list = _self;
  343. _new_list.insert(_new_list.end(), _obj.begin(), _obj.end());
  344. return vm->PyList(_new_list);
  345. });
  346. _vm->bindMethod<0>("list", "__len__", [](VM* vm, const pkpy::ArgList& args) {
  347. const PyVarList& _self = vm->PyList_AS_C(args[0]);
  348. return vm->PyInt(_self.size());
  349. });
  350. _vm->bindMethod<1>("list", "__getitem__", [](VM* vm, const pkpy::ArgList& args) {
  351. const PyVarList& _self = vm->PyList_AS_C(args[0]);
  352. if(args[1]->is_type(vm->_tp_slice)){
  353. _Slice s = vm->PySlice_AS_C(args[1]);
  354. s.normalize(_self.size());
  355. PyVarList _new_list;
  356. for(size_t i = s.start; i < s.stop; i++)
  357. _new_list.push_back(_self[i]);
  358. return vm->PyList(_new_list);
  359. }
  360. int _index = (int)vm->PyInt_AS_C(args[1]);
  361. _index = vm->normalizedIndex(_index, _self.size());
  362. return _self[_index];
  363. });
  364. _vm->bindMethod<2>("list", "__setitem__", [](VM* vm, const pkpy::ArgList& args) {
  365. PyVarList& _self = vm->PyList_AS_C(args[0]);
  366. int _index = (int)vm->PyInt_AS_C(args[1]);
  367. _index = vm->normalizedIndex(_index, _self.size());
  368. _self[_index] = args[2];
  369. return vm->None;
  370. });
  371. _vm->bindMethod<1>("list", "__delitem__", [](VM* vm, const pkpy::ArgList& args) {
  372. PyVarList& _self = vm->PyList_AS_C(args[0]);
  373. int _index = (int)vm->PyInt_AS_C(args[1]);
  374. _index = vm->normalizedIndex(_index, _self.size());
  375. _self.erase(_self.begin() + _index);
  376. return vm->None;
  377. });
  378. /************ PyTuple ************/
  379. _vm->bindStaticMethod<1>("tuple", "__new__", [](VM* vm, const pkpy::ArgList& args) {
  380. PyVarList _list = vm->PyList_AS_C(vm->call(vm->builtins->attribs["list"], args));
  381. return vm->PyTuple(_list);
  382. });
  383. _vm->bindMethod<0>("tuple", "__iter__", [](VM* vm, const pkpy::ArgList& args) {
  384. return vm->PyIter(pkpy::make_shared<BaseIterator, VectorIterator>(vm, args[0]));
  385. });
  386. _vm->bindMethod<0>("tuple", "__len__", [](VM* vm, const pkpy::ArgList& args) {
  387. const PyVarList& _self = vm->PyTuple_AS_C(args[0]);
  388. return vm->PyInt(_self.size());
  389. });
  390. _vm->bindMethod<1>("tuple", "__getitem__", [](VM* vm, const pkpy::ArgList& args) {
  391. const PyVarList& _self = vm->PyTuple_AS_C(args[0]);
  392. int _index = (int)vm->PyInt_AS_C(args[1]);
  393. _index = vm->normalizedIndex(_index, _self.size());
  394. return _self[_index];
  395. });
  396. /************ PyBool ************/
  397. _vm->bindStaticMethod<1>("bool", "__new__", CPP_LAMBDA(vm->asBool(args[0])));
  398. _vm->bindMethod<0>("bool", "__repr__", [](VM* vm, const pkpy::ArgList& args) {
  399. bool val = vm->PyBool_AS_C(args[0]);
  400. return vm->PyStr(val ? "True" : "False");
  401. });
  402. _vm->bindMethod<0>("bool", "__json__", [](VM* vm, const pkpy::ArgList& args) {
  403. bool val = vm->PyBool_AS_C(args[0]);
  404. return vm->PyStr(val ? "true" : "false");
  405. });
  406. _vm->bindMethod<1>("bool", "__xor__", [](VM* vm, const pkpy::ArgList& args) {
  407. bool _self = vm->PyBool_AS_C(args[0]);
  408. bool _obj = vm->PyBool_AS_C(args[1]);
  409. return vm->PyBool(_self ^ _obj);
  410. });
  411. _vm->bindMethod<0>("ellipsis", "__repr__", CPP_LAMBDA(vm->PyStr("Ellipsis")));
  412. }
  413. #include "builtins.h"
  // __EXPORT: per-platform decoration placed on the exported C entry points.
  #if defined(_WIN32)
      #define __EXPORT __declspec(dllexport)
  #elif __APPLE__
      #define __EXPORT __attribute__((visibility("default"))) __attribute__((used))
  #elif __EMSCRIPTEN__
      #define __EXPORT EMSCRIPTEN_KEEPALIVE
      // Also defined for Emscripten builds; this file only defines it.
      #define __NO_MAIN
  #else
      // Every other platform: no decoration.
      #define __EXPORT
  #endif
  424. void __addModuleTime(VM* vm){
  425. PyVar mod = vm->newModule("time");
  426. vm->bindFunc<0>(mod, "time", [](VM* vm, const pkpy::ArgList& args) {
  427. auto now = std::chrono::high_resolution_clock::now();
  428. return vm->PyFloat(std::chrono::duration_cast<std::chrono::microseconds>(now.time_since_epoch()).count() / 1000000.0);
  429. });
  430. }
  431. void __addModuleSys(VM* vm){
  432. PyVar mod = vm->newModule("sys");
  433. vm->bindFunc<1>(mod, "getrefcount", [](VM* vm, const pkpy::ArgList& args) {
  434. return vm->PyInt(args[0].use_count());
  435. });
  436. vm->bindFunc<0>(mod, "getrecursionlimit", [](VM* vm, const pkpy::ArgList& args) {
  437. return vm->PyInt(vm->maxRecursionDepth);
  438. });
  439. vm->bindFunc<1>(mod, "setrecursionlimit", [](VM* vm, const pkpy::ArgList& args) {
  440. vm->maxRecursionDepth = (int)vm->PyInt_AS_C(args[0]);
  441. return vm->None;
  442. });
  443. vm->setattr(mod, "version", vm->PyStr(PK_VERSION));
  444. }
  445. void __addModuleJson(VM* vm){
  446. PyVar mod = vm->newModule("json");
  447. vm->bindFunc<1>(mod, "loads", [](VM* vm, const pkpy::ArgList& args) {
  448. const _Str& expr = vm->PyStr_AS_C(args[0]);
  449. _Code code = vm->compile(expr, "<json>", JSON_MODE);
  450. return vm->_exec(code, vm->top_frame()->_module, vm->top_frame()->f_locals_copy());
  451. });
  452. vm->bindFunc<1>(mod, "dumps", [](VM* vm, const pkpy::ArgList& args) {
  453. return vm->asJson(args[0]);
  454. });
  455. }
  456. void __addModuleMath(VM* vm){
  457. PyVar mod = vm->newModule("math");
  458. vm->setattr(mod, "pi", vm->PyFloat(3.1415926535897932384));
  459. vm->setattr(mod, "e" , vm->PyFloat(2.7182818284590452354));
  460. vm->bindFunc<1>(mod, "log", [](VM* vm, const pkpy::ArgList& args) {
  461. return vm->PyFloat(log(vm->num_to_float(args[0])));
  462. });
  463. vm->bindFunc<1>(mod, "log10", [](VM* vm, const pkpy::ArgList& args) {
  464. return vm->PyFloat(log10(vm->num_to_float(args[0])));
  465. });
  466. vm->bindFunc<1>(mod, "log2", [](VM* vm, const pkpy::ArgList& args) {
  467. return vm->PyFloat(log2(vm->num_to_float(args[0])));
  468. });
  469. vm->bindFunc<1>(mod, "sin", [](VM* vm, const pkpy::ArgList& args) {
  470. return vm->PyFloat(sin(vm->num_to_float(args[0])));
  471. });
  472. vm->bindFunc<1>(mod, "cos", [](VM* vm, const pkpy::ArgList& args) {
  473. return vm->PyFloat(cos(vm->num_to_float(args[0])));
  474. });
  475. vm->bindFunc<1>(mod, "tan", [](VM* vm, const pkpy::ArgList& args) {
  476. return vm->PyFloat(tan(vm->num_to_float(args[0])));
  477. });
  478. vm->bindFunc<2>(mod, "isclose", [](VM* vm, const pkpy::ArgList& args) {
  479. f64 a = vm->num_to_float(args[0]);
  480. f64 b = vm->num_to_float(args[1]);
  481. return vm->PyBool(fabs(a - b) < 1e-9);
  482. });
  483. vm->bindFunc<1>(mod, "isnan", [](VM* vm, const pkpy::ArgList& args) {
  484. return vm->PyBool(std::isnan(vm->num_to_float(args[0])));
  485. });
  486. vm->bindFunc<1>(mod, "isinf", [](VM* vm, const pkpy::ArgList& args) {
  487. return vm->PyBool(std::isinf(vm->num_to_float(args[0])));
  488. });
  489. }
  490. #define PY_CLASS(mod, name) inline static PyVar _tp(VM* vm) { return vm->_modules[#mod]->attribs[#name]; }
  491. struct ReMatch {
  492. PY_CLASS(re, Match)
  493. i64 start;
  494. i64 end;
  495. std::smatch m;
  496. ReMatch(i64 start, i64 end, std::smatch m) : start(start), end(end), m(m) {}
  497. static PyVar _bind(VM* vm){
  498. PyVar _tp_match = vm->new_user_type_object(vm->_modules["re"], "Match", vm->_tp_object);
  499. vm->bindMethod<0>(_tp_match, "start", [](VM* vm, const pkpy::ArgList& args) {
  500. return vm->PyInt(UNION_GET(ReMatch, args[0]).start);
  501. });
  502. vm->bindMethod<0>(_tp_match, "end", [](VM* vm, const pkpy::ArgList& args) {
  503. return vm->PyInt(UNION_GET(ReMatch, args[0]).end);
  504. });
  505. vm->bindMethod<0>(_tp_match, "span", [](VM* vm, const pkpy::ArgList& args) {
  506. auto& m = UNION_GET(ReMatch, args[0]);
  507. PyVarList vec = { vm->PyInt(m.start), vm->PyInt(m.end) };
  508. return vm->PyTuple(vec);
  509. });
  510. vm->bindMethod<1>(_tp_match, "group", [](VM* vm, const pkpy::ArgList& args) {
  511. auto& m = UNION_GET(ReMatch, args[0]);
  512. int index = (int)vm->PyInt_AS_C(args[1]);
  513. index = vm->normalizedIndex(index, m.m.size());
  514. return vm->PyStr(m.m[index].str());
  515. });
  516. return _tp_match;
  517. }
  518. };
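  // Binding convention for a native C++ class:
  //   static PyVar _tp(VM* vm);   returns this class's type object from the VM.
  //   static PyVar _bind(VM* vm); sets up the class's bindings, registers its
  //                               type object in the VM and returns that type object.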
  523. PyVar __regex_search(const _Str& pattern, const _Str& string, bool fromStart, VM* vm){
  524. std::regex re(pattern);
  525. std::smatch m;
  526. if(std::regex_search(string, m, re)){
  527. if(fromStart && m.position() != 0) return vm->None;
  528. i64 start = string.__to_u8_index(m.position());
  529. i64 end = string.__to_u8_index(m.position() + m.length());
  530. return vm->new_object_c<ReMatch>(start, end, m);
  531. }
  532. return vm->None;
  533. };
  534. void __addModuleRe(VM* vm){
  535. PyVar mod = vm->newModule("re");
  536. ReMatch::_bind(vm);
  537. vm->bindFunc<2>(mod, "match", [](VM* vm, const pkpy::ArgList& args) {
  538. const _Str& pattern = vm->PyStr_AS_C(args[0]);
  539. const _Str& string = vm->PyStr_AS_C(args[1]);
  540. return __regex_search(pattern, string, true, vm);
  541. });
  542. vm->bindFunc<2>(mod, "search", [](VM* vm, const pkpy::ArgList& args) {
  543. const _Str& pattern = vm->PyStr_AS_C(args[0]);
  544. const _Str& string = vm->PyStr_AS_C(args[1]);
  545. return __regex_search(pattern, string, false, vm);
  546. });
  547. vm->bindFunc<3>(mod, "sub", [](VM* vm, const pkpy::ArgList& args) {
  548. const _Str& pattern = vm->PyStr_AS_C(args[0]);
  549. const _Str& repl = vm->PyStr_AS_C(args[1]);
  550. const _Str& string = vm->PyStr_AS_C(args[2]);
  551. std::regex re(pattern);
  552. return vm->PyStr(std::regex_replace(string, re, repl));
  553. });
  554. vm->bindFunc<2>(mod, "split", [](VM* vm, const pkpy::ArgList& args) {
  555. const _Str& pattern = vm->PyStr_AS_C(args[0]);
  556. const _Str& string = vm->PyStr_AS_C(args[1]);
  557. std::regex re(pattern);
  558. std::sregex_token_iterator it(string.begin(), string.end(), re, -1);
  559. std::sregex_token_iterator end;
  560. PyVarList vec;
  561. for(; it != end; ++it){
  562. vec.push_back(vm->PyStr(it->str()));
  563. }
  564. return vm->PyList(vec);
  565. });
  566. }
  /// Type-erased handle to an object handed out through the C API.
  class _PkExported{
  public:
      virtual ~_PkExported() = default;
      /// Address of the wrapped object.
      virtual void* get() = 0;
  };

  /// Every live PkExported wrapper; pkpy_delete searches it by wrapped address.
  static std::vector<_PkExported*> _pkLookupTable;

  /// Owns a heap-allocated `T` and registers itself in `_pkLookupTable` on
  /// construction. Destroying the wrapper destroys the `T`.
  template<typename T>
  class PkExported : public _PkExported{
      T* _ptr;
  public:
      /// Forwards the arguments to `T`'s constructor.
      template<typename... Args>
      PkExported(Args&&... args) {
          _ptr = new T(std::forward<Args>(args)...);
          _pkLookupTable.push_back(this);
      }

      // The wrapper is the sole owner of `_ptr`; a copy would delete it twice.
      PkExported(const PkExported&) = delete;
      PkExported& operator=(const PkExported&) = delete;

      ~PkExported() override { delete _ptr; }
      void* get() override { return _ptr; }
      operator T*() { return _ptr; }
  };

  // Allocates a registered PkExported<T>; the expression converts to `T*`.
  #define pkpy_allocate(T, ...) *(new PkExported<T>(__VA_ARGS__))
  587. extern "C" {
  588. __EXPORT
  589. /// Delete a pointer allocated by `pkpy_xxx_xxx`.
  590. /// It can be `VM*`, `REPL*`, `char*`, etc.
  591. ///
  592. /// !!!
  593. /// If the pointer is not allocated by `pkpy_xxx_xxx`, the behavior is undefined.
  594. /// For char*, you can also use trivial `delete` in your language.
  595. /// !!!
  596. void pkpy_delete(void* p){
  597. for(int i = 0; i < _pkLookupTable.size(); i++){
  598. if(_pkLookupTable[i]->get() == p){
  599. delete _pkLookupTable[i];
  600. _pkLookupTable.erase(_pkLookupTable.begin() + i);
  601. return;
  602. }
  603. }
  604. free(p);
  605. }
  606. __EXPORT
  607. /// Run a given source on a virtual machine.
  608. void pkpy_vm_exec(VM* vm, const char* source){
  609. vm->exec(source, "main.py", EXEC_MODE);
  610. }
  611. __EXPORT
  612. /// Get a global variable of a virtual machine.
  613. ///
  614. /// Return a json representing the result.
  615. /// If the variable is not found, return `nullptr`.
  616. char* pkpy_vm_get_global(VM* vm, const char* name){
  617. auto it = vm->_main->attribs.find(name);
  618. if(it == vm->_main->attribs.end()) return nullptr;
  619. try{
  620. _Str _json = vm->PyStr_AS_C(vm->asJson(it->second));
  621. return strdup(_json.c_str());
  622. }catch(...){
  623. return nullptr;
  624. }
  625. }
  626. __EXPORT
  627. /// Evaluate an expression.
  628. ///
  629. /// Return a json representing the result.
  630. /// If there is any error, return `nullptr`.
  631. char* pkpy_vm_eval(VM* vm, const char* source){
  632. PyVarOrNull ret = vm->exec(source, "<eval>", EVAL_MODE);
  633. if(ret == nullptr) return nullptr;
  634. try{
  635. _Str _json = vm->PyStr_AS_C(vm->asJson(ret));
  636. return strdup(_json.c_str());
  637. }catch(...){
  638. return nullptr;
  639. }
  640. }
  641. __EXPORT
  642. /// Create a REPL, using the given virtual machine as the backend.
  643. REPL* pkpy_new_repl(VM* vm){
  644. return pkpy_allocate(REPL, vm);
  645. }
  646. __EXPORT
  647. /// Input a source line to an interactive console.
  648. int pkpy_repl_input(REPL* r, const char* line){
  649. return r->input(line);
  650. }
  651. __EXPORT
  652. /// Add a source module into a virtual machine.
  653. void pkpy_vm_add_module(VM* vm, const char* name, const char* source){
  654. vm->addLazyModule(name, source);
  655. }
  656. void __vm_init(VM* vm){
  657. __initializeBuiltinFunctions(vm);
  658. __addModuleSys(vm);
  659. __addModuleTime(vm);
  660. __addModuleJson(vm);
  661. __addModuleMath(vm);
  662. __addModuleRe(vm);
  663. // add builtins | no exception handler | must succeed
  664. _Code code = vm->compile(__BUILTINS_CODE, "<builtins>", EXEC_MODE);
  665. vm->_exec(code, vm->builtins, {});
  666. pkpy_vm_add_module(vm, "random", __RANDOM_CODE);
  667. pkpy_vm_add_module(vm, "os", __OS_CODE);
  668. }
  669. __EXPORT
  670. /// Create a virtual machine.
  671. VM* pkpy_new_vm(bool use_stdio){
  672. VM* vm = pkpy_allocate(VM, use_stdio);
  673. __vm_init(vm);
  674. return vm;
  675. }
  676. __EXPORT
  677. /// Read the standard output and standard error as string of a virtual machine.
  678. /// The `vm->use_stdio` should be `false`.
  679. /// After this operation, both stream will be cleared.
  680. ///
  681. /// Return a json representing the result.
  682. char* pkpy_vm_read_output(VM* vm){
  683. if(vm->use_stdio) return nullptr;
  684. _StrStream* s_out = (_StrStream*)(vm->_stdout);
  685. _StrStream* s_err = (_StrStream*)(vm->_stderr);
  686. _Str _stdout = s_out->str();
  687. _Str _stderr = s_err->str();
  688. _StrStream ss;
  689. ss << '{' << "\"stdout\": " << _stdout.__escape(false);
  690. ss << ", ";
  691. ss << "\"stderr\": " << _stderr.__escape(false) << '}';
  692. s_out->str("");
  693. s_err->str("");
  694. return strdup(ss.str().c_str());
  695. }
  696. }