pocketpy.h 31 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797
  1. #pragma once
  2. #include "vm.h"
  3. #include "compiler.h"
  4. #include "repl.h"
  5. _Code VM::compile(_Str source, _Str filename, CompileMode mode) {
  6. Compiler compiler(this, source.c_str(), filename, mode);
  7. try{
  8. return compiler.__fillCode();
  9. }catch(_Exception& e){
  10. _error(e);
  11. return nullptr;
  12. }
  13. }
  14. #define BIND_NUM_ARITH_OPT(name, op) \
  15. _vm->bindMethodMulti<1>({"int","float"}, #name, [](VM* vm, const pkpy::Args& args){ \
  16. if(args[0]->is_type(vm->_tp_int) && args[1]->is_type(vm->_tp_int)){ \
  17. return vm->PyInt(vm->PyInt_AS_C(args[0]) op vm->PyInt_AS_C(args[1])); \
  18. }else{ \
  19. return vm->PyFloat(vm->num_to_float(args[0]) op vm->num_to_float(args[1])); \
  20. } \
  21. });
  22. #define BIND_NUM_LOGICAL_OPT(name, op, is_eq) \
  23. _vm->bindMethodMulti<1>({"int","float"}, #name, [](VM* vm, const pkpy::Args& args){ \
  24. bool _0 = args[0]->is_type(vm->_tp_int) || args[0]->is_type(vm->_tp_float); \
  25. bool _1 = args[1]->is_type(vm->_tp_int) || args[1]->is_type(vm->_tp_float); \
  26. if(!_0 || !_1){ \
  27. if constexpr(is_eq) return vm->PyBool(args[0].get() op args[1].get()); \
  28. vm->typeError("unsupported operand type(s) for " #op ); \
  29. } \
  30. return vm->PyBool(vm->num_to_float(args[0]) op vm->num_to_float(args[1])); \
  31. });
  32. void __initializeBuiltinFunctions(VM* _vm) {
  33. BIND_NUM_ARITH_OPT(__add__, +)
  34. BIND_NUM_ARITH_OPT(__sub__, -)
  35. BIND_NUM_ARITH_OPT(__mul__, *)
  36. BIND_NUM_LOGICAL_OPT(__lt__, <, false)
  37. BIND_NUM_LOGICAL_OPT(__le__, <=, false)
  38. BIND_NUM_LOGICAL_OPT(__gt__, >, false)
  39. BIND_NUM_LOGICAL_OPT(__ge__, >=, false)
  40. BIND_NUM_LOGICAL_OPT(__eq__, ==, true)
  41. BIND_NUM_LOGICAL_OPT(__ne__, !=, true)
  42. #undef BIND_NUM_ARITH_OPT
  43. #undef BIND_NUM_LOGICAL_OPT
  44. _vm->bindBuiltinFunc<1>("__sys_stdout_write", [](VM* vm, const pkpy::Args& args) {
  45. (*vm->_stdout) << vm->PyStr_AS_C(args[0]);
  46. return vm->None;
  47. });
  48. _vm->bindBuiltinFunc<0>("super", [](VM* vm, const pkpy::Args& args) {
  49. auto it = vm->top_frame()->f_locals().find(m_self);
  50. if(it == vm->top_frame()->f_locals().end()) vm->typeError("super() can only be called in a class method");
  51. return vm->new_object(vm->_tp_super, it->second);
  52. });
  53. _vm->bindBuiltinFunc<1>("eval", [](VM* vm, const pkpy::Args& args) {
  54. _Code code = vm->compile(vm->PyStr_AS_C(args[0]), "<eval>", EVAL_MODE);
  55. return vm->_exec(code, vm->top_frame()->_module, vm->top_frame()->_locals);
  56. });
  57. _vm->bindBuiltinFunc<1>("exec", [](VM* vm, const pkpy::Args& args) {
  58. _Code code = vm->compile(vm->PyStr_AS_C(args[0]), "<exec>", EXEC_MODE);
  59. vm->_exec(code, vm->top_frame()->_module, vm->top_frame()->_locals);
  60. return vm->None;
  61. });
  62. _vm->bindBuiltinFunc<-1>("exit", [](VM* vm, const pkpy::Args& args) {
  63. if(args.size() == 0) std::exit(0);
  64. else if(args.size() == 1) std::exit(vm->PyInt_AS_C(args[0]));
  65. else vm->typeError("exit() takes at most 1 argument");
  66. return vm->None;
  67. });
  68. _vm->bindBuiltinFunc<1>("repr", CPP_LAMBDA(vm->asRepr(args[0])));
  69. _vm->bindBuiltinFunc<1>("hash", CPP_LAMBDA(vm->PyInt(vm->hash(args[0]))));
  70. _vm->bindBuiltinFunc<1>("len", CPP_LAMBDA(vm->call(args[0], __len__, pkpy::noArg())));
  71. _vm->bindBuiltinFunc<1>("chr", [](VM* vm, const pkpy::Args& args) {
  72. i64 i = vm->PyInt_AS_C(args[0]);
  73. if (i < 0 || i > 128) vm->valueError("chr() arg not in range(128)");
  74. return vm->PyStr(std::string(1, (char)i));
  75. });
  76. _vm->bindBuiltinFunc<1>("ord", [](VM* vm, const pkpy::Args& args) {
  77. _Str s = vm->PyStr_AS_C(args[0]);
  78. if (s.size() != 1) vm->typeError("ord() expected an ASCII character");
  79. return vm->PyInt((i64)(s.c_str()[0]));
  80. });
  81. _vm->bindBuiltinFunc<2>("hasattr", [](VM* vm, const pkpy::Args& args) {
  82. return vm->PyBool(vm->getattr(args[0], vm->PyStr_AS_C(args[1]), false) != nullptr);
  83. });
  84. _vm->bindBuiltinFunc<3>("setattr", [](VM* vm, const pkpy::Args& args) {
  85. PyVar obj = args[0];
  86. vm->setattr(obj, vm->PyStr_AS_C(args[1]), args[2]);
  87. return vm->None;
  88. });
  89. _vm->bindBuiltinFunc<2>("getattr", [](VM* vm, const pkpy::Args& args) {
  90. _Str name = vm->PyStr_AS_C(args[1]);
  91. return vm->getattr(args[0], name);
  92. });
  93. _vm->bindBuiltinFunc<1>("hex", [](VM* vm, const pkpy::Args& args) {
  94. std::stringstream ss;
  95. ss << std::hex << vm->PyInt_AS_C(args[0]);
  96. return vm->PyStr("0x" + ss.str());
  97. });
  98. _vm->bindBuiltinFunc<1>("dir", [](VM* vm, const pkpy::Args& args) {
  99. std::vector<_Str> names;
  100. for (auto& [k, _] : args[0]->attribs) names.push_back(k);
  101. for (auto& [k, _] : args[0]->type->attribs) {
  102. if (k.find("__") == 0) continue;
  103. if (std::find(names.begin(), names.end(), k) == names.end()) names.push_back(k);
  104. }
  105. PyVarList ret;
  106. for (const auto& name : names) ret.push_back(vm->PyStr(name));
  107. std::sort(ret.begin(), ret.end(), [vm](const PyVar& a, const PyVar& b) {
  108. return vm->PyStr_AS_C(a) < vm->PyStr_AS_C(b);
  109. });
  110. return vm->PyList(ret);
  111. });
  112. _vm->bindMethod<0>("object", "__repr__", [](VM* vm, const pkpy::Args& args) {
  113. PyVar _self = args[0];
  114. std::stringstream ss;
  115. ss << std::hex << (uintptr_t)_self.get();
  116. _Str s = "<" + OBJ_TP_NAME(_self) + " object at 0x" + ss.str() + ">";
  117. return vm->PyStr(s);
  118. });
  119. _vm->bindMethod<1>("object", "__eq__", CPP_LAMBDA(vm->PyBool(args[0] == args[1])));
  120. _vm->bindMethod<1>("object", "__ne__", CPP_LAMBDA(vm->PyBool(args[0] != args[1])));
  121. _vm->bindStaticMethod<1>("type", "__new__", CPP_LAMBDA(args[0]->type));
  122. _vm->bindStaticMethod<-1>("range", "__new__", [](VM* vm, const pkpy::Args& args) {
  123. _Range r;
  124. switch (args.size()) {
  125. case 1: r.stop = vm->PyInt_AS_C(args[0]); break;
  126. case 2: r.start = vm->PyInt_AS_C(args[0]); r.stop = vm->PyInt_AS_C(args[1]); break;
  127. case 3: r.start = vm->PyInt_AS_C(args[0]); r.stop = vm->PyInt_AS_C(args[1]); r.step = vm->PyInt_AS_C(args[2]); break;
  128. default: vm->typeError("expected 1-3 arguments, but got " + std::to_string(args.size()));
  129. }
  130. return vm->PyRange(r);
  131. });
  132. _vm->bindMethod<0>("range", "__iter__", CPP_LAMBDA(
  133. vm->PyIter(pkpy::make_shared<BaseIterator, RangeIterator>(vm, args[0]))
  134. ));
  135. _vm->bindMethod<0>("NoneType", "__repr__", CPP_LAMBDA(vm->PyStr("None")));
  136. _vm->bindMethod<0>("NoneType", "__json__", CPP_LAMBDA(vm->PyStr("null")));
  137. _vm->bindMethodMulti<1>({"int", "float"}, "__truediv__", [](VM* vm, const pkpy::Args& args) {
  138. f64 rhs = vm->num_to_float(args[1]);
  139. if (rhs == 0) vm->zeroDivisionError();
  140. return vm->PyFloat(vm->num_to_float(args[0]) / rhs);
  141. });
  142. _vm->bindMethodMulti<1>({"int", "float"}, "__pow__", [](VM* vm, const pkpy::Args& args) {
  143. if(args[0]->is_type(vm->_tp_int) && args[1]->is_type(vm->_tp_int)){
  144. return vm->PyInt((i64)round(pow(vm->PyInt_AS_C(args[0]), vm->PyInt_AS_C(args[1]))));
  145. }else{
  146. return vm->PyFloat((f64)pow(vm->num_to_float(args[0]), vm->num_to_float(args[1])));
  147. }
  148. });
  149. /************ PyInt ************/
  150. _vm->bindStaticMethod<1>("int", "__new__", [](VM* vm, const pkpy::Args& args) {
  151. if (args[0]->is_type(vm->_tp_int)) return args[0];
  152. if (args[0]->is_type(vm->_tp_float)) return vm->PyInt((i64)vm->PyFloat_AS_C(args[0]));
  153. if (args[0]->is_type(vm->_tp_bool)) return vm->PyInt(vm->PyBool_AS_C(args[0]) ? 1 : 0);
  154. if (args[0]->is_type(vm->_tp_str)) {
  155. const _Str& s = vm->PyStr_AS_C(args[0]);
  156. try{
  157. size_t parsed = 0;
  158. i64 val = std::stoll(s, &parsed, 10);
  159. if(parsed != s.size()) throw std::invalid_argument("");
  160. return vm->PyInt(val);
  161. }catch(std::invalid_argument&){
  162. vm->valueError("invalid literal for int(): '" + s + "'");
  163. }
  164. }
  165. vm->typeError("int() argument must be a int, float, bool or str");
  166. return vm->None;
  167. });
  168. _vm->bindMethod<1>("int", "__floordiv__", [](VM* vm, const pkpy::Args& args) {
  169. i64 rhs = vm->PyInt_AS_C(args[1]);
  170. if(rhs == 0) vm->zeroDivisionError();
  171. return vm->PyInt(vm->PyInt_AS_C(args[0]) / rhs);
  172. });
  173. _vm->bindMethod<1>("int", "__mod__", [](VM* vm, const pkpy::Args& args) {
  174. i64 rhs = vm->PyInt_AS_C(args[1]);
  175. if(rhs == 0) vm->zeroDivisionError();
  176. return vm->PyInt(vm->PyInt_AS_C(args[0]) % rhs);
  177. });
  178. _vm->bindMethod<0>("int", "__repr__", [](VM* vm, const pkpy::Args& args) {
  179. return vm->PyStr(std::to_string(vm->PyInt_AS_C(args[0])));
  180. });
  181. _vm->bindMethod<0>("int", "__json__", [](VM* vm, const pkpy::Args& args) {
  182. return vm->PyStr(std::to_string((int)vm->PyInt_AS_C(args[0])));
  183. });
  184. #define __INT_BITWISE_OP(name,op) \
  185. _vm->bindMethod<1>("int", #name, [](VM* vm, const pkpy::Args& args) { \
  186. return vm->PyInt(vm->PyInt_AS_C(args[0]) op vm->PyInt_AS_C(args[1])); \
  187. });
  188. __INT_BITWISE_OP(__lshift__, <<)
  189. __INT_BITWISE_OP(__rshift__, >>)
  190. __INT_BITWISE_OP(__and__, &)
  191. __INT_BITWISE_OP(__or__, |)
  192. __INT_BITWISE_OP(__xor__, ^)
  193. #undef __INT_BITWISE_OP
  194. /************ PyFloat ************/
  195. _vm->bindStaticMethod<1>("float", "__new__", [](VM* vm, const pkpy::Args& args) {
  196. if (args[0]->is_type(vm->_tp_int)) return vm->PyFloat((f64)vm->PyInt_AS_C(args[0]));
  197. if (args[0]->is_type(vm->_tp_float)) return args[0];
  198. if (args[0]->is_type(vm->_tp_bool)) return vm->PyFloat(vm->PyBool_AS_C(args[0]) ? 1.0 : 0.0);
  199. if (args[0]->is_type(vm->_tp_str)) {
  200. const _Str& s = vm->PyStr_AS_C(args[0]);
  201. if(s == "inf") return vm->PyFloat(INFINITY);
  202. if(s == "-inf") return vm->PyFloat(-INFINITY);
  203. try{
  204. f64 val = std::stod(s);
  205. return vm->PyFloat(val);
  206. }catch(std::invalid_argument&){
  207. vm->valueError("invalid literal for float(): '" + s + "'");
  208. }
  209. }
  210. vm->typeError("float() argument must be a int, float, bool or str");
  211. return vm->None;
  212. });
  213. _vm->bindMethod<0>("float", "__repr__", [](VM* vm, const pkpy::Args& args) {
  214. f64 val = vm->PyFloat_AS_C(args[0]);
  215. if(std::isinf(val) || std::isnan(val)) return vm->PyStr(std::to_string(val));
  216. _StrStream ss;
  217. ss << std::setprecision(std::numeric_limits<f64>::max_digits10-1) << val;
  218. std::string s = ss.str();
  219. if(std::all_of(s.begin()+1, s.end(), isdigit)) s += ".0";
  220. return vm->PyStr(s);
  221. });
  222. _vm->bindMethod<0>("float", "__json__", [](VM* vm, const pkpy::Args& args) {
  223. f64 val = vm->PyFloat_AS_C(args[0]);
  224. if(std::isinf(val) || std::isnan(val)) vm->valueError("cannot jsonify 'nan' or 'inf'");
  225. return vm->PyStr(std::to_string(val));
  226. });
  227. /************ PyString ************/
  228. _vm->bindStaticMethod<1>("str", "__new__", CPP_LAMBDA(vm->asStr(args[0])));
  229. _vm->bindMethod<1>("str", "__add__", [](VM* vm, const pkpy::Args& args) {
  230. const _Str& lhs = vm->PyStr_AS_C(args[0]);
  231. const _Str& rhs = vm->PyStr_AS_C(args[1]);
  232. return vm->PyStr(lhs + rhs);
  233. });
  234. _vm->bindMethod<0>("str", "__len__", [](VM* vm, const pkpy::Args& args) {
  235. const _Str& _self = vm->PyStr_AS_C(args[0]);
  236. return vm->PyInt(_self.u8_length());
  237. });
  238. _vm->bindMethod<1>("str", "__contains__", [](VM* vm, const pkpy::Args& args) {
  239. const _Str& _self = vm->PyStr_AS_C(args[0]);
  240. const _Str& _other = vm->PyStr_AS_C(args[1]);
  241. return vm->PyBool(_self.find(_other) != _Str::npos);
  242. });
  243. _vm->bindMethod<0>("str", "__str__", CPP_LAMBDA(args[0]));
  244. _vm->bindMethod<0>("str", "__iter__", CPP_LAMBDA(
  245. vm->PyIter(pkpy::make_shared<BaseIterator, StringIterator>(vm, args[0]))
  246. ));
  247. _vm->bindMethod<0>("str", "__repr__", [](VM* vm, const pkpy::Args& args) {
  248. const _Str& _self = vm->PyStr_AS_C(args[0]);
  249. return vm->PyStr(_self.__escape(true));
  250. });
  251. _vm->bindMethod<0>("str", "__json__", [](VM* vm, const pkpy::Args& args) {
  252. const _Str& _self = vm->PyStr_AS_C(args[0]);
  253. return vm->PyStr(_self.__escape(false));
  254. });
  255. _vm->bindMethod<1>("str", "__eq__", [](VM* vm, const pkpy::Args& args) {
  256. if(args[0]->is_type(vm->_tp_str) && args[1]->is_type(vm->_tp_str))
  257. return vm->PyBool(vm->PyStr_AS_C(args[0]) == vm->PyStr_AS_C(args[1]));
  258. return vm->PyBool(args[0] == args[1]);
  259. });
  260. _vm->bindMethod<1>("str", "__ne__", [](VM* vm, const pkpy::Args& args) {
  261. if(args[0]->is_type(vm->_tp_str) && args[1]->is_type(vm->_tp_str))
  262. return vm->PyBool(vm->PyStr_AS_C(args[0]) != vm->PyStr_AS_C(args[1]));
  263. return vm->PyBool(args[0] != args[1]);
  264. });
  265. _vm->bindMethod<1>("str", "__getitem__", [](VM* vm, const pkpy::Args& args) {
  266. const _Str& _self (vm->PyStr_AS_C(args[0]));
  267. if(args[1]->is_type(vm->_tp_slice)){
  268. _Slice s = vm->PySlice_AS_C(args[1]);
  269. s.normalize(_self.u8_length());
  270. return vm->PyStr(_self.u8_substr(s.start, s.stop));
  271. }
  272. int _index = (int)vm->PyInt_AS_C(args[1]);
  273. _index = vm->normalized_index(_index, _self.u8_length());
  274. return vm->PyStr(_self.u8_getitem(_index));
  275. });
  276. _vm->bindMethod<1>("str", "__gt__", [](VM* vm, const pkpy::Args& args) {
  277. const _Str& _self (vm->PyStr_AS_C(args[0]));
  278. const _Str& _obj (vm->PyStr_AS_C(args[1]));
  279. return vm->PyBool(_self > _obj);
  280. });
  281. _vm->bindMethod<1>("str", "__lt__", [](VM* vm, const pkpy::Args& args) {
  282. const _Str& _self (vm->PyStr_AS_C(args[0]));
  283. const _Str& _obj (vm->PyStr_AS_C(args[1]));
  284. return vm->PyBool(_self < _obj);
  285. });
  286. _vm->bindMethod<2>("str", "replace", [](VM* vm, const pkpy::Args& args) {
  287. const _Str& _self = vm->PyStr_AS_C(args[0]);
  288. const _Str& _old = vm->PyStr_AS_C(args[1]);
  289. const _Str& _new = vm->PyStr_AS_C(args[2]);
  290. _Str _copy = _self;
  291. // replace all occurences of _old with _new in _copy
  292. size_t pos = 0;
  293. while ((pos = _copy.find(_old, pos)) != std::string::npos) {
  294. _copy.replace(pos, _old.length(), _new);
  295. pos += _new.length();
  296. }
  297. return vm->PyStr(_copy);
  298. });
  299. _vm->bindMethod<1>("str", "startswith", [](VM* vm, const pkpy::Args& args) {
  300. const _Str& _self = vm->PyStr_AS_C(args[0]);
  301. const _Str& _prefix = vm->PyStr_AS_C(args[1]);
  302. return vm->PyBool(_self.find(_prefix) == 0);
  303. });
  304. _vm->bindMethod<1>("str", "endswith", [](VM* vm, const pkpy::Args& args) {
  305. const _Str& _self = vm->PyStr_AS_C(args[0]);
  306. const _Str& _suffix = vm->PyStr_AS_C(args[1]);
  307. return vm->PyBool(_self.rfind(_suffix) == _self.length() - _suffix.length());
  308. });
  309. _vm->bindMethod<1>("str", "join", [](VM* vm, const pkpy::Args& args) {
  310. const _Str& _self = vm->PyStr_AS_C(args[0]);
  311. PyVarList* _list = nullptr;
  312. if(args[1]->is_type(vm->_tp_list)){
  313. _list = &vm->PyList_AS_C(args[1]);
  314. }else if(args[1]->is_type(vm->_tp_tuple)){
  315. _list = &vm->PyTuple_AS_C(args[1]);
  316. }else{
  317. vm->typeError("can only join a list or tuple");
  318. }
  319. _StrStream ss;
  320. for(int i = 0; i < _list->size(); i++){
  321. if(i > 0) ss << _self;
  322. ss << vm->PyStr_AS_C(vm->asStr(_list->operator[](i)));
  323. }
  324. return vm->PyStr(ss.str());
  325. });
  326. /************ PyList ************/
  327. _vm->bindMethod<0>("list", "__iter__", [](VM* vm, const pkpy::Args& args) {
  328. return vm->PyIter(
  329. pkpy::make_shared<BaseIterator, VectorIterator>(vm, args[0])
  330. );
  331. });
  332. _vm->bindMethod<1>("list", "append", [](VM* vm, const pkpy::Args& args) {
  333. PyVarList& _self = vm->PyList_AS_C(args[0]);
  334. _self.push_back(args[1]);
  335. return vm->None;
  336. });
  337. _vm->bindMethod<2>("list", "insert", [](VM* vm, const pkpy::Args& args) {
  338. PyVarList& _self = vm->PyList_AS_C(args[0]);
  339. int _index = (int)vm->PyInt_AS_C(args[1]);
  340. if(_index < 0) _index += _self.size();
  341. if(_index < 0) _index = 0;
  342. if(_index > _self.size()) _index = _self.size();
  343. _self.insert(_self.begin() + _index, args[2]);
  344. return vm->None;
  345. });
  346. _vm->bindMethod<0>("list", "clear", [](VM* vm, const pkpy::Args& args) {
  347. vm->PyList_AS_C(args[0]).clear();
  348. return vm->None;
  349. });
  350. _vm->bindMethod<0>("list", "copy", [](VM* vm, const pkpy::Args& args) {
  351. return vm->PyList(vm->PyList_AS_C(args[0]));
  352. });
  353. _vm->bindMethod<1>("list", "__add__", [](VM* vm, const pkpy::Args& args) {
  354. const PyVarList& _self = vm->PyList_AS_C(args[0]);
  355. const PyVarList& _obj = vm->PyList_AS_C(args[1]);
  356. PyVarList _new_list = _self;
  357. _new_list.insert(_new_list.end(), _obj.begin(), _obj.end());
  358. return vm->PyList(_new_list);
  359. });
  360. _vm->bindMethod<0>("list", "__len__", [](VM* vm, const pkpy::Args& args) {
  361. const PyVarList& _self = vm->PyList_AS_C(args[0]);
  362. return vm->PyInt(_self.size());
  363. });
  364. _vm->bindMethodMulti<1>({"list", "tuple"}, "__getitem__", [](VM* vm, const pkpy::Args& args) {
  365. bool list = args[0]->is_type(vm->_tp_list);
  366. const PyVarList& _self = list ? vm->PyList_AS_C(args[0]) : vm->PyTuple_AS_C(args[0]);
  367. if(args[1]->is_type(vm->_tp_slice)){
  368. _Slice s = vm->PySlice_AS_C(args[1]);
  369. s.normalize(_self.size());
  370. PyVarList _new_list;
  371. for(size_t i = s.start; i < s.stop; i++) _new_list.push_back(_self[i]);
  372. return list ? vm->PyList(_new_list) : vm->PyTuple(_new_list);
  373. }
  374. int _index = (int)vm->PyInt_AS_C(args[1]);
  375. _index = vm->normalized_index(_index, _self.size());
  376. return _self[_index];
  377. });
  378. _vm->bindMethod<2>("list", "__setitem__", [](VM* vm, const pkpy::Args& args) {
  379. PyVarList& _self = vm->PyList_AS_C(args[0]);
  380. int _index = (int)vm->PyInt_AS_C(args[1]);
  381. _index = vm->normalized_index(_index, _self.size());
  382. _self[_index] = args[2];
  383. return vm->None;
  384. });
  385. _vm->bindMethod<1>("list", "__delitem__", [](VM* vm, const pkpy::Args& args) {
  386. PyVarList& _self = vm->PyList_AS_C(args[0]);
  387. int _index = (int)vm->PyInt_AS_C(args[1]);
  388. _index = vm->normalized_index(_index, _self.size());
  389. _self.erase(_self.begin() + _index);
  390. return vm->None;
  391. });
  392. /************ PyTuple ************/
  393. _vm->bindStaticMethod<1>("tuple", "__new__", [](VM* vm, const pkpy::Args& args) {
  394. PyVarList _list = vm->PyList_AS_C(vm->call(vm->builtins->attribs["list"], args));
  395. return vm->PyTuple(_list);
  396. });
  397. _vm->bindMethod<0>("tuple", "__iter__", [](VM* vm, const pkpy::Args& args) {
  398. return vm->PyIter(pkpy::make_shared<BaseIterator, VectorIterator>(vm, args[0]));
  399. });
  400. _vm->bindMethod<0>("tuple", "__len__", [](VM* vm, const pkpy::Args& args) {
  401. const PyVarList& _self = vm->PyTuple_AS_C(args[0]);
  402. return vm->PyInt(_self.size());
  403. });
  404. /************ PyBool ************/
  405. _vm->bindStaticMethod<1>("bool", "__new__", CPP_LAMBDA(vm->asBool(args[0])));
  406. _vm->bindMethod<0>("bool", "__repr__", [](VM* vm, const pkpy::Args& args) {
  407. bool val = vm->PyBool_AS_C(args[0]);
  408. return vm->PyStr(val ? "True" : "False");
  409. });
  410. _vm->bindMethod<0>("bool", "__json__", [](VM* vm, const pkpy::Args& args) {
  411. bool val = vm->PyBool_AS_C(args[0]);
  412. return vm->PyStr(val ? "true" : "false");
  413. });
  414. _vm->bindMethod<1>("bool", "__xor__", [](VM* vm, const pkpy::Args& args) {
  415. bool _self = vm->PyBool_AS_C(args[0]);
  416. bool _obj = vm->PyBool_AS_C(args[1]);
  417. return vm->PyBool(_self ^ _obj);
  418. });
  419. _vm->bindMethod<0>("ellipsis", "__repr__", CPP_LAMBDA(vm->PyStr("Ellipsis")));
  420. }
  421. #include "builtins.h"
  422. #ifdef _WIN32
  423. #define __EXPORT __declspec(dllexport)
  424. #elif __APPLE__
  425. #define __EXPORT __attribute__((visibility("default"))) __attribute__((used))
  426. #elif __EMSCRIPTEN__
  427. #define __EXPORT EMSCRIPTEN_KEEPALIVE
  428. #define __NO_MAIN
  429. #else
  430. #define __EXPORT
  431. #endif
  432. void __add_module_time(VM* vm){
  433. PyVar mod = vm->new_module("time");
  434. vm->bindFunc<0>(mod, "time", [](VM* vm, const pkpy::Args& args) {
  435. auto now = std::chrono::high_resolution_clock::now();
  436. return vm->PyFloat(std::chrono::duration_cast<std::chrono::microseconds>(now.time_since_epoch()).count() / 1000000.0);
  437. });
  438. }
  439. void __add_module_sys(VM* vm){
  440. PyVar mod = vm->new_module("sys");
  441. vm->bindFunc<1>(mod, "getrefcount", [](VM* vm, const pkpy::Args& args) {
  442. return vm->PyInt(args[0].use_count());
  443. });
  444. vm->bindFunc<0>(mod, "getrecursionlimit", [](VM* vm, const pkpy::Args& args) {
  445. return vm->PyInt(vm->maxRecursionDepth);
  446. });
  447. vm->bindFunc<1>(mod, "setrecursionlimit", [](VM* vm, const pkpy::Args& args) {
  448. vm->maxRecursionDepth = (int)vm->PyInt_AS_C(args[0]);
  449. return vm->None;
  450. });
  451. vm->setattr(mod, "version", vm->PyStr(PK_VERSION));
  452. }
  453. void __add_module_json(VM* vm){
  454. PyVar mod = vm->new_module("json");
  455. vm->bindFunc<1>(mod, "loads", [](VM* vm, const pkpy::Args& args) {
  456. const _Str& expr = vm->PyStr_AS_C(args[0]);
  457. _Code code = vm->compile(expr, "<json>", JSON_MODE);
  458. return vm->_exec(code, vm->top_frame()->_module, vm->top_frame()->_locals);
  459. });
  460. vm->bindFunc<1>(mod, "dumps", CPP_LAMBDA(vm->call(args[0], __json__)));
  461. }
  462. void __add_module_math(VM* vm){
  463. PyVar mod = vm->new_module("math");
  464. vm->setattr(mod, "pi", vm->PyFloat(3.1415926535897932384));
  465. vm->setattr(mod, "e" , vm->PyFloat(2.7182818284590452354));
  466. vm->bindFunc<1>(mod, "log", CPP_LAMBDA(vm->PyFloat(log(vm->num_to_float(args[0])))));
  467. vm->bindFunc<1>(mod, "log10", CPP_LAMBDA(vm->PyFloat(log10(vm->num_to_float(args[0])))));
  468. vm->bindFunc<1>(mod, "log2", CPP_LAMBDA(vm->PyFloat(log2(vm->num_to_float(args[0])))));
  469. vm->bindFunc<1>(mod, "sin", CPP_LAMBDA(vm->PyFloat(sin(vm->num_to_float(args[0])))));
  470. vm->bindFunc<1>(mod, "cos", CPP_LAMBDA(vm->PyFloat(cos(vm->num_to_float(args[0])))));
  471. vm->bindFunc<1>(mod, "tan", CPP_LAMBDA(vm->PyFloat(tan(vm->num_to_float(args[0])))));
  472. vm->bindFunc<1>(mod, "isnan", CPP_LAMBDA(vm->PyBool(std::isnan(vm->num_to_float(args[0])))));
  473. vm->bindFunc<1>(mod, "isinf", CPP_LAMBDA(vm->PyBool(std::isinf(vm->num_to_float(args[0])))));
  474. }
  475. void __add_module_dis(VM* vm){
  476. PyVar mod = vm->new_module("dis");
  477. vm->bindFunc<1>(mod, "dis", [](VM* vm, const pkpy::Args& args) {
  478. _Code code = vm->PyFunction_AS_C(args[0])->code;
  479. (*vm->_stdout) << vm->disassemble(code);
  480. return vm->None;
  481. });
  482. }
  483. #define PY_CLASS(mod, name) inline static PyVar _tp(VM* vm) { return vm->_modules[#mod]->attribs[#name]; }
  484. struct ReMatch {
  485. PY_CLASS(re, Match)
  486. i64 start;
  487. i64 end;
  488. std::smatch m;
  489. ReMatch(i64 start, i64 end, std::smatch m) : start(start), end(end), m(m) {}
  490. static PyVar _bind(VM* vm){
  491. PyVar _tp_match = vm->new_user_type_object(vm->_modules["re"], "Match", vm->_tp_object);
  492. vm->bindMethod<0>(_tp_match, "start", CPP_LAMBDA(vm->PyInt(OBJ_GET(ReMatch, args[0]).start)));
  493. vm->bindMethod<0>(_tp_match, "end", CPP_LAMBDA(vm->PyInt(OBJ_GET(ReMatch, args[0]).end)));
  494. vm->bindMethod<0>(_tp_match, "span", [](VM* vm, const pkpy::Args& args) {
  495. auto& m = OBJ_GET(ReMatch, args[0]);
  496. return vm->PyTuple({ vm->PyInt(m.start), vm->PyInt(m.end) });
  497. });
  498. vm->bindMethod<1>(_tp_match, "group", [](VM* vm, const pkpy::Args& args) {
  499. auto& m = OBJ_GET(ReMatch, args[0]);
  500. int index = (int)vm->PyInt_AS_C(args[1]);
  501. index = vm->normalized_index(index, m.m.size());
  502. return vm->PyStr(m.m[index].str());
  503. });
  504. return _tp_match;
  505. }
  506. };
  507. PyVar __regex_search(const _Str& pattern, const _Str& string, bool fromStart, VM* vm){
  508. std::regex re(pattern);
  509. std::smatch m;
  510. if(std::regex_search(string, m, re)){
  511. if(fromStart && m.position() != 0) return vm->None;
  512. i64 start = string.__to_u8_index(m.position());
  513. i64 end = string.__to_u8_index(m.position() + m.length());
  514. return vm->new_object_c<ReMatch>(start, end, m);
  515. }
  516. return vm->None;
  517. };
  518. void __add_module_re(VM* vm){
  519. PyVar mod = vm->new_module("re");
  520. ReMatch::_bind(vm);
  521. vm->bindFunc<2>(mod, "match", [](VM* vm, const pkpy::Args& args) {
  522. const _Str& pattern = vm->PyStr_AS_C(args[0]);
  523. const _Str& string = vm->PyStr_AS_C(args[1]);
  524. return __regex_search(pattern, string, true, vm);
  525. });
  526. vm->bindFunc<2>(mod, "search", [](VM* vm, const pkpy::Args& args) {
  527. const _Str& pattern = vm->PyStr_AS_C(args[0]);
  528. const _Str& string = vm->PyStr_AS_C(args[1]);
  529. return __regex_search(pattern, string, false, vm);
  530. });
  531. vm->bindFunc<3>(mod, "sub", [](VM* vm, const pkpy::Args& args) {
  532. const _Str& pattern = vm->PyStr_AS_C(args[0]);
  533. const _Str& repl = vm->PyStr_AS_C(args[1]);
  534. const _Str& string = vm->PyStr_AS_C(args[2]);
  535. std::regex re(pattern);
  536. return vm->PyStr(std::regex_replace(string, re, repl));
  537. });
  538. vm->bindFunc<2>(mod, "split", [](VM* vm, const pkpy::Args& args) {
  539. const _Str& pattern = vm->PyStr_AS_C(args[0]);
  540. const _Str& string = vm->PyStr_AS_C(args[1]);
  541. std::regex re(pattern);
  542. std::sregex_token_iterator it(string.begin(), string.end(), re, -1);
  543. std::sregex_token_iterator end;
  544. PyVarList vec;
  545. for(; it != end; ++it){
  546. vec.push_back(vm->PyStr(it->str()));
  547. }
  548. return vm->PyList(vec);
  549. });
  550. }
  551. class _PkExported{
  552. public:
  553. virtual ~_PkExported() = default;
  554. virtual void* get() = 0;
  555. };
  556. static std::vector<_PkExported*> _pkLookupTable;
  557. template<typename T>
  558. class PkExported : public _PkExported{
  559. T* _ptr;
  560. public:
  561. template<typename... Args>
  562. PkExported(Args&&... args) {
  563. _ptr = new T(std::forward<Args>(args)...);
  564. _pkLookupTable.push_back(this);
  565. }
  566. ~PkExported() override { delete _ptr; }
  567. void* get() override { return _ptr; }
  568. operator T*() { return _ptr; }
  569. };
  570. #define pkpy_allocate(T, ...) *(new PkExported<T>(__VA_ARGS__))
  571. extern "C" {
  572. __EXPORT
  573. /// Delete a pointer allocated by `pkpy_xxx_xxx`.
  574. /// It can be `VM*`, `REPL*`, `char*`, etc.
  575. ///
  576. /// !!!
  577. /// If the pointer is not allocated by `pkpy_xxx_xxx`, the behavior is undefined.
  578. /// !!!
  579. void pkpy_delete(void* p){
  580. for(int i = 0; i < _pkLookupTable.size(); i++){
  581. if(_pkLookupTable[i]->get() == p){
  582. delete _pkLookupTable[i];
  583. _pkLookupTable.erase(_pkLookupTable.begin() + i);
  584. return;
  585. }
  586. }
  587. free(p);
  588. }
  589. __EXPORT
  590. /// Run a given source on a virtual machine.
  591. void pkpy_vm_exec(VM* vm, const char* source){
  592. vm->exec(source, "main.py", EXEC_MODE);
  593. }
  594. __EXPORT
  595. /// Get a global variable of a virtual machine.
  596. ///
  597. /// Return `__repr__` of the result.
  598. /// If the variable is not found, return `nullptr`.
  599. char* pkpy_vm_get_global(VM* vm, const char* name){
  600. auto it = vm->_main->attribs.find(name);
  601. if(it == vm->_main->attribs.end()) return nullptr;
  602. try{
  603. _Str _repr = vm->PyStr_AS_C(vm->asRepr(it->second));
  604. return strdup(_repr.c_str());
  605. }catch(...){
  606. return nullptr;
  607. }
  608. }
  609. __EXPORT
  610. /// Evaluate an expression.
  611. ///
  612. /// Return `__repr__` of the result.
  613. /// If there is any error, return `nullptr`.
  614. char* pkpy_vm_eval(VM* vm, const char* source){
  615. PyVarOrNull ret = vm->exec(source, "<eval>", EVAL_MODE);
  616. if(ret == nullptr) return nullptr;
  617. try{
  618. _Str _repr = vm->PyStr_AS_C(vm->asRepr(ret));
  619. return strdup(_repr.c_str());
  620. }catch(...){
  621. return nullptr;
  622. }
  623. }
  624. __EXPORT
  625. /// Create a REPL, using the given virtual machine as the backend.
  626. REPL* pkpy_new_repl(VM* vm){
  627. return pkpy_allocate(REPL, vm);
  628. }
  629. __EXPORT
  630. /// Input a source line to an interactive console. Return true if need more lines.
  631. bool pkpy_repl_input(REPL* r, const char* line){
  632. return r->input(line);
  633. }
  634. __EXPORT
  635. /// Add a source module into a virtual machine.
  636. void pkpy_vm_add_module(VM* vm, const char* name, const char* source){
  637. vm->_lazy_modules[name] = source;
  638. }
  639. __EXPORT
  640. /// Create a virtual machine.
  641. VM* pkpy_new_vm(bool use_stdio){
  642. VM* vm = pkpy_allocate(VM, use_stdio);
  643. __initializeBuiltinFunctions(vm);
  644. __add_module_sys(vm);
  645. __add_module_time(vm);
  646. __add_module_json(vm);
  647. __add_module_math(vm);
  648. __add_module_re(vm);
  649. __add_module_dis(vm);
  650. // add builtins | no exception handler | must succeed
  651. _Code code = vm->compile(__BUILTINS_CODE, "<builtins>", EXEC_MODE);
  652. vm->_exec(code, vm->builtins, pkpy::make_shared<PyVarDict>());
  653. pkpy_vm_add_module(vm, "random", __RANDOM_CODE);
  654. return vm;
  655. }
  656. __EXPORT
  657. /// Read the standard output and standard error as string of a virtual machine.
  658. /// The `vm->use_stdio` should be `false`.
  659. /// After this operation, both stream will be cleared.
  660. ///
  661. /// Return a json representing the result.
  662. char* pkpy_vm_read_output(VM* vm){
  663. if(vm->use_stdio) return nullptr;
  664. _StrStream* s_out = (_StrStream*)(vm->_stdout);
  665. _StrStream* s_err = (_StrStream*)(vm->_stderr);
  666. _Str _stdout = s_out->str();
  667. _Str _stderr = s_err->str();
  668. _StrStream ss;
  669. ss << '{' << "\"stdout\": " << _stdout.__escape(false);
  670. ss << ", " << "\"stderr\": " << _stderr.__escape(false) << '}';
  671. s_out->str(""); s_err->str("");
  672. return strdup(ss.str().c_str());
  673. }
  674. }
  675. #include "_bindings.h"