diff --git "a/docs/logdump.txt" "b/docs/logdump.txt" new file mode 100644--- /dev/null +++ "b/docs/logdump.txt" @@ -0,0 +1,3273 @@ +Hugging Face's logo +Hugging Face +Models +Datasets +Spaces +Buckets +new +Docs +Enterprise +Pricing + + +Jobs +: + InosLihka +/ +69ed8c25d70108f37acdf744 + +Status + +Canceled +Created + +26/04/2026, 09:23:09 + +Hardware + +a10g-large + +Image + +ghcr.io/astral-sh/uv:python3.12-bookworm +Command + +bash -c 'echo $LOCAL_FILES_ENCODED | xargs -n 2 bash -c '\''echo "$1" | base64 -d > "$0"'\'' && uv run '\''train_on_hf.py'\''' + +Environment variables + +FAST_MODE=1 LOCAL_FILES_ENCODED=train_on_hf.py IyAvLy8gc2NyaXB0CiMgcmVxdWlyZXMtcHl0aG9uID0gIj49My4xMCIKIyBkZXBlbmRlbmNpZXMgPSBbCiMgICAidG9yY2giLAojICAgInRyYW5zZm9ybWVycz09NC41Ni4yIiwKIyAgICJ0cmw9PTAuMjIuMiIsCiMgICAiZGF0YXNldHMiLAojICAgInBlZnQiLAojICAgImFjY2VsZXJhdGUiLAojICAgImJpdHNhbmRieXRlcyIsCiMgICAidW5zbG90aCIsCiMgICAib3BlbmVudi1jb3JlIiwKIyAgICJmYXN0YXBpIiwKIyAgICJ1dmljb3JuIiwKIyAgICJweWRhbnRpYyIsCiMgICAibWF0cGxvdGxpYiIsCiMgICAiaHVnZ2luZ2ZhY2VfaHViIiwKIyBdCiMgLy8vCiIiIgpFbmQtdG8tZW5kIHRyYWluaW5nIGpvYiBmb3IgSEYgSm9icy4KClN1Ym1pdCBmcm9tIGxvY2FsIG1hY2hpbmUgd2l0aDoKICAgIGhmIGpvYnMgdXYgcnVuIC0tZmxhdm9yIGExMGctbGFyZ2UgLS1zZWNyZXRzIEhGX1RPS0VOIHNjcmlwdHMvdHJhaW5fb25faGYucHkKCldoYXQgaXQgZG9lcyAobm8gYmFieXNpdHRpbmcgcmVxdWlyZWQpOgogIDEuIENsb25lIHJoeXRobV9lbnYgZnJvbSBIRiBTcGFjZSAoZ2V0cyBsYXRlc3QgbWV0YS1STCBjb2RlIGZyb20gbWFpbikKICAyLiBHZW5lcmF0ZSBkYXRhc2V0IChjb250aW51b3VzIHByb2ZpbGVzLCBoaW50X2ZyYWN0aW9uPTAuMTUpCiAgMy4gVHJhaW4gUXdlbiAyLjUtM0IgKyBMb1JBIHJhbmsgOCB2aWEgR1JQTyAoMTUwMCBzdGVwcykKICA0LiBSdW4gZXZhbCBvbiBhbGwgMyBjb25kaXRpb25zIChkaXNjcmV0ZSwgaW4tZGlzdCwgT09EKQogIDUuIEdlbmVyYXRlIGFsbCA1IHBsb3RzIGZyb20gbG9nX2hpc3RvcnkKICA2LiBVcGxvYWQgdHJhaW5lZCBtb2RlbCArIHBsb3RzICsgZXZhbCBKU09OIHRvIGEgbmV3IEhGIEh1YiBtb2RlbCByZXBvCgpPdmVycmlkZSBkZWZhdWx0cyB2aWEgZW52IHZhcnM6CiAgICBNQVhfU1RFUFMsIE5VTV9FUElTT0RFUywgTE9SQV9SQU5LLCBCRVRBLCBNT0RFTF9SRVBPCgpFc3RpbWF0ZWQgY29zdCBvbiBhMTBnLWxhcmdlIGF0ICQxLjUwL2hyOiB+JDMgZm9yIDE1MDAgc3RlcHMgKH4yaCkuCiIiIgoKaW1wb3J0IGpzb24KaW1wb3J0IG9zCmltcG9ydCBzaHV0aWwKaW1wb3J0IHN1YnByb2Nlc3MKaW1wb3J0IHN5cwpmcm9tIHBhdGhsaWIgaW1wb3J0IFBhdGgKCiMgLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tCiMgQ29uZmlnIChvdmVycmlkYWJsZSB2aWEgZW52IHZhcnMpCiMgLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tClJFUE9fVVJMID0gb3MuZW52aXJvbi5nZXQoIlJFUE9fVVJMIiwgImh0dHBzOi8vaHVnZ2luZ2ZhY2UuY28vc3BhY2VzL0lub3NMaWhrYS9yaHl0aG1fZW52IikKV09SS19ESVIgPSAiL3RtcC9yaHl0aG1fZW52IgpPVVRQVVRfRElSID0gIi90bXAvcmh5dGhtX2Vudi9vdXRwdXRzL3JoeXRobWVudl9tZXRhX3RyYWluZWQiClBMT1RTX0RJUiA9ICIvdG1wL3JoeXRobV9lbnYvcGxvdHMiCgojIEZBU1RfTU9ERSBwcmVzZXQ6IH4xMC0xNSBtaW4gaXRlcmF0aW9uIG9uIEExMDAgbGFyZ2UuCiMgVXNlIGZvciBoeXBlcnBhcmFtZXRlciBzd2VlcHMgYW5kIHBpcGVsaW5lIGRlYnVnZ2luZy4KRkFTVF9NT0RFID0gb3MuZW52aXJvbi5nZXQoIkZBU1RfTU9ERSIsICIwIikgPT0gIjEiCgppZiBGQVNUX01PREU6CiAgICAjIEl0ZXIgMyBwcmVzZXQ6IDgwMCBzdGVwcyArIDggZ2VuZXJhdGlvbnMgKyBMb1JBIDE2IHRvIGVzY2FwZSBtb2RlIGNvbGxhcHNlIGZvciByZWFsCiAgICBERUZBVUxUUyA9IGRpY3QoTUFYX1NURVBTPTgwMCwgTlVNX0VQSVNPREVTPTIwMCwgTUFYX1NBTVBMRVM9MjAwMCwKICAgICAgICAgICAgICAgICAgICBOVU1fR0VORVJBVElPTlM9OCwgTE9SQV9SQU5LPTE2LCBCRVRBPTAuMDQsCiAgICAgICAgICAgICAgICAgICAgTEVBUk5JTkdfUkFURT01ZS01LCBFVkFMX0VQSVNPREVTPTIpCmVsc2U6CiAgICBERUZBVUxUUyA9IGRpY3QoTUFYX1NURVBTPTIwMDAsIE5VTV9FUElTT0RFUz00MDAsIE1BWF9TQU1QTEVTPTQwMDAsCiAgICAgICAgICAgICAgICAgICAgTlVNX0dFTkVSQVRJT05TPTgsIExPUkFfUkFOSz0xNiwgQkVUQT0wLjA0LAogICAgICAgICAgICAgICAgICAgIExFQVJOSU5HX1JBVEU9NWUtNSwgRVZBTF9FUElTT0RFUz01KQoKTUFYX1NURVBTID0gaW50KG9zLmVudmlyb24uZ2V0KCJNQVhfU1RFUFMiLCBzdHIoREVGQVVMVFNbIk1BWF9TVEVQUyJdKSkpCk5VTV9FUElTT0RFUyA9IGludChvcy5lbnZpcm9uLmdldCgiTlVNX0VQSVNPREVTIiwgc3RyKERFRkFVTFRTWyJOVU1fRVBJU09ERVMiXSkpKQpNQVhfU0FNUExFUyA9IGludChvcy5lbnZpcm9uLmdldCgiTUFYX1NBTVBMRVMiLCBzdHIoREVGQVVMVFNbIk1BWF9TQU1QTEVTIl0pKSkKTlVNX0dFTkVSQVRJT05TID0gaW50KG9zLmVudmlyb24uZ2V0KCJOVU1fR0VORVJBVElPTlMiLCBzdHIoREVGQVVMVFNbIk5VTV9HRU5FUkFUSU9OUyJdKSkpCkxPUkFfUkFOSyA9IGludChvcy5lbnZpcm9uLmdldCgiTE9SQV9SQU5LIiwgc3RyKERFRkFVTFRTWyJMT1JBX1JBTksiXSkpKQpCRVRBID0gZmxvYXQob3MuZW52aXJvbi5nZXQoIkJFVEEiLCBzdHIoREVGQVVMVFNbIkJFVEEiXSkpKQpMRUFSTklOR19SQVRFID0gZmxvYXQob3MuZW52aXJvbi5nZXQoIkxFQVJOSU5HX1JBVEUiLCBzdHIoREVGQVVMVFNbIkxFQVJOSU5HX1JBVEUiXSkpKQpFVkFMX0VQSVNPREVTID0gaW50KG9zLmVudmlyb24uZ2V0KCJFVkFMX0VQSVNPREVTIiwgc3RyKERFRkFVTFRTWyJFVkFMX0VQSVNPREVTIl0pKSkKCiMgRWFjaCBpdGVyYXRpb24gdXBsb2FkcyB0byBhIHVuaXF1ZSByZXBvIGlmIE1PREVMX1JFUE9fU1VGRklYIGlzIHNldApTVUZGSVggPSBvcy5lbnZpcm9uLmdldCgiTU9ERUxfUkVQT19TVUZGSVgiLCAiIikKREVGQVVMVF9SRVBPID0gIklub3NMaWhrYS9yaHl0aG0tZW52LW1ldGEtdHJhaW5lZCIgKyAoZiIte1NVRkZJWH0iIGlmIFNVRkZJWCBlbHNlICIiKQpNT0RFTF9SRVBPID0gb3MuZW52aXJvbi5nZXQoIk1PREVMX1JFUE8iLCBERUZBVUxUX1JFUE8pCgpwcmludChmIj09PSBSdW4gY29uZmlnID09PSIpCnByaW50KGYiICBGQVNUX01PREU6IHtGQVNUX01PREV9IikKcHJpbnQoZiIgIE1BWF9TVEVQUz17TUFYX1NURVBTfSwgTlVNX0VQSVNPREVTPXtOVU1fRVBJU09ERVN9LCBNQVhfU0FNUExFUz17TUFYX1NBTVBMRVN9IikKcHJpbnQoZiIgIE5VTV9HRU5FUkFUSU9OUz17TlVNX0dFTkVSQVRJT05TfSwgTE9SQV9SQU5LPXtMT1JBX1JBTkt9LCBCRVRBPXtCRVRBfSIpCnByaW50KGYiICBMRUFSTklOR19SQVRFPXtMRUFSTklOR19SQVRFfSwgRVZBTF9FUElTT0RFUz17RVZBTF9FUElTT0RFU30iKQpwcmludChmIiAgTU9ERUxfUkVQTz17TU9ERUxfUkVQT30iKQpwcmludCgpCgoKZGVmIHJ1bihjbWQ6IGxpc3Rbc3RyXSwgKiprdyk6CiAgICAiIiJSdW4gc3VicHJvY2VzcyB3aXRoIGxvZ2dpbmcuIiIiCiAgICBwcmludChmIlxuPj4+IHsnICcuam9pbihjbWQpIGlmIGlzaW5zdGFuY2UoY21kLCBsaXN0KSBlbHNlIGNtZH0iLCBmbHVzaD1UcnVlKQogICAgc3VicHJvY2Vzcy5ydW4oY21kLCBjaGVjaz1UcnVlLCAqKmt3KQoKCmRlZiBtYWluKCk6CiAgICAjIC0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLQogICAgIyAxLiBDbG9uZSB0aGUgcmh5dGhtX2VudiByZXBvCiAgICAjIC0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLQogICAgaWYgUGF0aChXT1JLX0RJUikuZXhpc3RzKCk6CiAgICAgICAgc2h1dGlsLnJtdHJlZShXT1JLX0RJUikKICAgIHJ1bihbImdpdCIsICJjbG9uZSIsIFJFUE9fVVJMLCBXT1JLX0RJUl0pCiAgICBvcy5jaGRpcihXT1JLX0RJUikKICAgIHN5cy5wYXRoLmluc2VydCgwLCBXT1JLX0RJUikKICAgIHN5cy5wYXRoLmluc2VydCgwLCBvcy5wYXRoLmpvaW4oV09SS19ESVIsICJ0cmFpbmluZyIpKQoKICAgICMgVmVyaWZ5IG1ldGEtUkwgY29kZSBpcyBwcmVzZW50CiAgICBkYXRhc2V0X3B5ID0gUGF0aCgidHJhaW5pbmcvZGF0YXNldC5weSIpLnJlYWRfdGV4dCgpCiAgICBhc3NlcnQgInByb2ZpbGVfbW9kZSIgaW4gZGF0YXNldF9weSwgIkNsb25lZCByZXBvIGRvZXNuJ3QgaGF2ZSBtZXRhLVJMIGNvZGUiCiAgICBwcmludCgiT0s6IG1ldGEtUkwgY29kZSBwcmVzZW50IGluIGNsb25lZCByZXBvIikKCiAgICAjIC0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLQogICAgIyAyLiBUcmFpbgogICAgIyAtLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0KICAgIHRyYWluX2FyZ3MgPSBbCiAgICAgICAgInB5dGhvbiIsICJ0cmFpbmluZy90cmFpbi5weSIsCiAgICAgICAgIi0tbWF4X3N0ZXBzIiwgc3RyKE1BWF9TVEVQUyksCiAgICAgICAgIi0tbnVtX2VwaXNvZGVzIiwgc3RyKE5VTV9FUElTT0RFUyksCiAgICAgICAgIi0tbWF4X3NhbXBsZXMiLCBzdHIoTUFYX1NBTVBMRVMpLAogICAgICAgICItLW51bV9nZW5lcmF0aW9ucyIsIHN0cihOVU1fR0VORVJBVElPTlMpLAogICAgICAgICItLWxvcmFfcmFuayIsIHN0cihMT1JBX1JBTkspLAogICAgICAgICItLWJldGEiLCBzdHIoQkVUQSksCiAgICAgICAgIi0tbGVhcm5pbmdfcmF0ZSIsIHN0cihMRUFSTklOR19SQVRFKSwKICAgICAgICAiLS1vdXRwdXRfZGlyIiwgT1VUUFVUX0RJUiwKICAgIF0KICAgIHJ1bih0cmFpbl9hcmdzKQoKICAgICMgLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tCiAgICAjIDMuIEV2YWwgKDMgY29uZGl0aW9uczogZGlzY3JldGUtMyAvIGluLWRpc3QgLyBPT0QpCiAgICAjIC0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLQogICAgZXZhbF9hcmdzID0gWwogICAgICAgICJweXRob24iLCAidHJhaW5pbmcvaW5mZXJlbmNlX2V2YWwucHkiLAogICAgICAgICItLW1vZGVsX3BhdGgiLCBPVVRQVVRfRElSLAogICAgICAgICItLW51bV9lcGlzb2RlcyIsIHN0cihFVkFMX0VQSVNPREVTKSwKICAgICAgICAiLS1vdXRwdXRfZmlsZSIsICJldmFsX3Jlc3VsdHMuanNvbiIsCiAgICBdCiAgICBydW4oZXZhbF9hcmdzKQoKICAgICMgLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tCiAgICAjIDQuIEdlbmVyYXRlIHBsb3RzIGZyb20gc2F2ZWQgbG9nX2hpc3RvcnkKICAgICMgLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tCiAgICBQYXRoKFBMT1RTX0RJUikubWtkaXIoZXhpc3Rfb2s9VHJ1ZSkKICAgIGxvZ19wYXRoID0gb3MucGF0aC5qb2luKE9VVFBVVF9ESVIsICJsb2dfaGlzdG9yeS5qc29uIikKICAgIGlmIFBhdGgobG9nX3BhdGgpLmV4aXN0cygpOgogICAgICAgIHJ1bihbInB5dGhvbiIsICJzY3JpcHRzL3Bsb3RfZnJvbV9sb2cucHkiLCAiLS1sb2ciLCBsb2dfcGF0aCwgIi0tb3V0IiwgUExPVFNfRElSXSkKICAgIGVsc2U6CiAgICAgICAgcHJpbnQoZiJXQVJOSU5HOiBsb2dfaGlzdG9yeS5qc29uIG5vdCBmb3VuZCBhdCB7bG9nX3BhdGh9IikKCiAgICAjIC0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLQogICAgIyA1LiBVcGxvYWQgZXZlcnl0aGluZyB0byBIRiBIdWIKICAgICMgLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tLS0tCiAgICB0b2tlbiA9IG9zLmVudmlyb24uZ2V0KCJIRl9UT0tFTiIpCiAgICBpZiBub3QgdG9rZW46CiAgICAgICAgcHJpbnQoIldBUk5JTkc6IEhGX1RPS0VOIG5vdCBzZXQsIHNraXBwaW5nIHVwbG9hZCIpCiAgICAgICAgcHJpbnQoZiJPdXRwdXRzIGluOiB7T1VUUFVUX0RJUn0iKQogICAgICAgIHJldHVybgoKICAgIGZyb20gaHVnZ2luZ2ZhY2VfaHViIGltcG9ydCBIZkFwaSwgbG9naW4KICAgIGxvZ2luKHRva2VuPXRva2VuKQogICAgYXBpID0gSGZBcGkoKQogICAgYXBpLmNyZWF0ZV9yZXBvKE1PREVMX1JFUE8sIGV4aXN0X29rPVRydWUsIHJlcG9fdHlwZT0ibW9kZWwiKQoKICAgICMgVXBsb2FkIHRyYWluZWQgbW9kZWwgKyBjb25maWcgKyBsb2dfaGlzdG9yeQogICAgYXBpLnVwbG9hZF9mb2xkZXIoCiAgICAgICAgZm9sZGVyX3BhdGg9T1VUUFVUX0RJUiwKICAgICAgICByZXBvX2lkPU1PREVMX1JFUE8sCiAgICAgICAgcmVwb190eXBlPSJtb2RlbCIsCiAgICAgICAgY29tbWl0X21lc3NhZ2U9ZiJUcmFpbmVkIHtNQVhfU1RFUFN9LXN0ZXAgR1JQTyBtZXRhLVJMIGFnZW50IiwKICAgICkKCiAgICAjIFVwbG9hZCBldmFsIEpTT04KICAgIGFwaS51cGxvYWRfZmlsZSgKICAgICAgICBwYXRoX29yX2ZpbGVvYmo9ImV2YWxfcmVzdWx0cy5qc29uIiwKICAgICAgICBwYXRoX2luX3JlcG89ImV2YWxfcmVzdWx0cy5qc29uIiwKICAgICAgICByZXBvX2lkPU1PREVMX1JFUE8sCiAgICAgICAgcmVwb190eXBlPSJtb2RlbCIsCiAgICApCgogICAgIyBVcGxvYWQgcGxvdHMgaWYgZ2VuZXJhdGVkCiAgICBpZiBQYXRoKFBMT1RTX0RJUikuZXhpc3RzKCkgYW5kIGFueShQYXRoKFBMT1RTX0RJUikuaXRlcmRpcigpKToKICAgICAgICBhcGkudXBsb2FkX2ZvbGRlcigKICAgICAgICAgICAgZm9sZGVyX3BhdGg9UExPVFNfRElSLAogICAgICAgICAgICBwYXRoX2luX3JlcG89InBsb3RzIiwKICAgICAgICAgICAgcmVwb19pZD1NT0RFTF9SRVBPLAogICAgICAgICAgICByZXBvX3R5cGU9Im1vZGVsIiwKICAgICAgICApCgogICAgcHJpbnQoKQogICAgcHJpbnQoIj0iICogNjApCiAgICBwcmludCgiRE9ORSIpCiAgICBwcmludChmIiAgVHJhaW5lZCBtb2RlbDogaHR0cHM6Ly9odWdnaW5nZmFjZS5jby97TU9ERUxfUkVQT30iKQogICAgcHJpbnQoZiIgIEV2YWwgSlNPTjogICAgIGh0dHBzOi8vaHVnZ2luZ2ZhY2UuY28ve01PREVMX1JFUE99L2Jsb2IvbWFpbi9ldmFsX3Jlc3VsdHMuanNvbiIpCiAgICBwcmludChmIiAgUGxvdHM6ICAgICAgICAgaHR0cHM6Ly9odWdnaW5nZmFjZS5jby97TU9ERUxfUkVQT30vdHJlZS9tYWluL3Bsb3RzIikKICAgIHByaW50KCI9IiAqIDYwKQoKCmlmIF9fbmFtZV9fID09ICJfX21haW5fXyI6CiAgICBtYWluKCkK MODEL_REPO_SUFFIX=iter4 +Secrets + +HF_TOKEN +Logs +===== Job started at 2026-04-26 03:53:10 ===== + +Downloading hf-xet (4.0MiB) + +Downloading pydantic-core (2.0MiB) + +Downloading kiwisolver (1.4MiB) + +Downloading pyarrow (46.6MiB) + +Downloading transformers (11.1MiB) + +Downloading hf-transfer (3.4MiB) + +Downloading nvidia-cufile-cu12 (1.1MiB) + +Downloading cryptography (4.5MiB) + +Downloading networkx (2.0MiB) + +Downloading torchvision (7.7MiB) + +Downloading nvidia-nvjitlink-cu12 (37.4MiB) + +Downloading pillow (6.8MiB) + +Downloading pygments (1.2MiB) + +Downloading unsloth (63.9MiB) + +Downloading openai (1.1MiB) + +Downloading sympy (6.0MiB) + +Downloading brotli (1.4MiB) + +Downloading fonttools (4.8MiB) + +Downloading triton (179.5MiB) + +Downloading numpy (15.9MiB) + +Downloading nvidia-cudnn-cu12 (674.0MiB) + +Downloading aiohttp (1.7MiB) + +Downloading nvidia-curand-cu12 (60.7MiB) + +Downloading nvidia-cusparselt-cu12 (273.9MiB) + +Downloading nvidia-cuda-nvrtc-cu12 (84.0MiB) + +Downloading nvidia-cuda-cupti-cu12 (9.8MiB) + +Downloading nvidia-nccl-cu12 (307.4MiB) + +Downloading tokenizers (3.1MiB) + +Downloading matplotlib (8.4MiB) + +Downloading nvidia-nvshmem-cu12 (132.7MiB) + +Downloading pandas (10.4MiB) + +Downloading xformers (3.1MiB) + +Downloading beartype (1.3MiB) + +Downloading torch (873.2MiB) + +Downloading nvidia-cufft-cu12 (184.2MiB) + +Downloading nvidia-cusparse-cu12 (274.9MiB) + +Downloading nvidia-cusolver-cu12 (255.1MiB) + +Downloading gradio (18.8MiB) + +Downloading bitsandbytes (57.8MiB) + +Downloading nvidia-cublas-cu12 (566.8MiB) + +Downloading diffusers (4.8MiB) + +Downloading torchao (3.1MiB) + +Downloading cuda-bindings (11.6MiB) + +Downloading sentencepiece (1.3MiB) + + Downloaded nvidia-cufile-cu12 + + Downloaded pygments + + Downloaded beartype + + Downloaded sentencepiece + + Downloaded brotli + + Downloaded kiwisolver + + Downloaded aiohttp + + Downloaded pydantic-core + + Downloaded networkx + + Downloaded tokenizers + + Downloaded openai + + Downloaded xformers + + Downloaded hf-transfer + + Downloaded hf-xet + + Downloaded cryptography + + Downloaded torchao + + Downloaded fonttools + + Downloaded diffusers + + Downloaded pillow + + Downloaded torchvision + + Downloaded sympy + + Downloaded matplotlib + + Downloaded nvidia-cuda-cupti-cu12 + + Downloaded cuda-bindings + + Downloaded transformers + + Downloaded numpy + + Downloaded pandas + + Downloaded gradio + + Downloaded nvidia-nvjitlink-cu12 + + Downloaded bitsandbytes + + Downloaded nvidia-curand-cu12 + + Downloaded pyarrow + + Downloaded nvidia-cuda-nvrtc-cu12 + + Downloaded unsloth + + Downloaded nvidia-nvshmem-cu12 + + Downloaded nvidia-cufft-cu12 + + Downloaded triton + + Downloaded nvidia-cusolver-cu12 + + Downloaded nvidia-cusparselt-cu12 + + Downloaded nvidia-cusparse-cu12 + + Downloaded nvidia-nccl-cu12 + + Downloaded nvidia-cublas-cu12 + + Downloaded nvidia-cudnn-cu12 + + Downloaded torch + +Installed 172 packages in 531ms + +=== Run config === + + FAST_MODE: True + + MAX_STEPS=800, NUM_EPISODES=200, MAX_SAMPLES=2000 + + NUM_GENERATIONS=8, LORA_RANK=16, BETA=0.04 + + LEARNING_RATE=5e-05, EVAL_EPISODES=2 + + MODEL_REPO=InosLihka/rhythm-env-meta-trained-iter4 + + + +>>> git clone https://huggingface.co/spaces/InosLihka/rhythm_env /tmp/rhythm_env + +Cloning into '/tmp/rhythm_env'... + +OK: meta-RL code present in cloned repo + + +>>> python training/train.py --max_steps 800 --num_episodes 200 --max_samples 2000 --num_generations 8 --lora_rank 16 --beta 0.04 --learning_rate 5e-05 --output_dir /tmp/rhythm_env/outputs/rhythmenv_meta_trained + +============================================================ + +Step 1: Generating training dataset (continuous profiles) + +============================================================ + +Generated 2000 samples from 72 episodes (0 with profile hint, 2000 without) + +Dataset size: 2000 + + +============================================================ + +Step 2: Loading model unsloth/Qwen2.5-3B-Instruct + +============================================================ + +🦥 Unsloth: Will patch your computer to enable 2x faster free finetuning. + +🦥 Unsloth Zoo will now patch everything to make training faster! + +==((====))== Unsloth 2026.4.8: Fast Qwen2 patching. Transformers: 4.56.2. + + \\ /| NVIDIA A10G. Num GPUs = 1. Max memory: 22.301 GB. Platform: Linux. + +O^O/ \_/ \ Torch: 2.10.0+cu128. CUDA: 8.6. CUDA Toolkit: 12.8. Triton: 3.6.0 + +\ / Bfloat16 = TRUE. FA [Xformers = 0.0.35. FA2 = False] + + "-____-" Free license: http://github.com/unslothai/unsloth + +Unsloth: Fast downloading is enabled - ignore downloading bars which are red colored! + + + +model.safetensors: 0%| | 0.00/2.36G [00:00. + +Unsloth 2026.4.8 patched 36 layers with 36 QKV layers, 36 O layers and 36 MLP layers. + +LoRA rank: 16, alpha: 32 + + +============================================================ + +Step 3: Setting up reward functions + +============================================================ + +Using: format_valid + action_legal + env_reward + belief_accuracy + + +============================================================ + +Step 4: Configuring GRPO trainer + +============================================================ + +Unsloth: We now expect `per_device_train_batch_size` * `gradient_accumulation_steps` * `world_size` to be a multiple of `num_generations`. + +We will change the batch size of 1 to the `num_generations` of 8 + +Using GRPOConfig with reward_weights=[0.05, 0.05, 1.5, 3.0] + +max_steps=800, num_generations=8, lr=5e-05, beta=0.04 + +max_prompt_length=600, max_completion_length=32 + +hint_fraction=0.0 (curriculum warmup) + + +============================================================ + +Step 5: Starting GRPO training + +============================================================ + +==((====))== Unsloth - 2x faster free finetuning | Num GPUs used = 1 + + \\ /| Num examples = 2,000 | Num Epochs = 2 | Total steps = 800 + +O^O/ \_/ \ Batch size per device = 8 | Gradient accumulation steps = 4 + +\ / Data Parallel GPUs = 1 | Total batch size (8 x 4 x 1) = 32 + + "-____-" Trainable parameters = 29,933,568 of 3,115,872,256 (0.96% trained) + + +Unsloth: Will smartly offload gradients to save VRAM! + + + 0%| | 0/800 [00:00