TensorCat commited on
Commit
422dab1
·
verified ·
1 Parent(s): 0ded223

Delete UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/.DS_Store +0 -0
  2. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/dataset_split_summary.json +0 -14
  3. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/generation_eval/generation_details.jsonl +0 -20
  4. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/generation_eval/generation_metrics.json +0 -10
  5. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/lora_adapter/README.md +0 -209
  6. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/lora_adapter/adapter_config.json +0 -46
  7. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/lora_adapter/adapter_model.safetensors +0 -3
  8. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/lora_adapter/chat_template.jinja +0 -89
  9. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/lora_adapter/tokenizer.json +0 -3
  10. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/lora_adapter/tokenizer_config.json +0 -29
  11. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/lora_adapter/training_args.bin +0 -3
  12. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/rag_augmented_dataset/rag_augmented_sft_dataset.jsonl +0 -0
  13. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/rag_augmented_dataset/rag_augmented_sft_dataset_preview.json +0 -212
  14. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/rag_augmented_dataset/rag_text_length_summary.json +0 -11
  15. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/retrieval_eval/retrieval_details.jsonl +0 -0
  16. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/retrieval_eval/retrieval_metrics.json +0 -10
  17. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/README.md +0 -57
  18. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-1000/README.md +0 -209
  19. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-1000/adapter_config.json +0 -46
  20. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-1000/adapter_model.safetensors +0 -3
  21. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-1000/chat_template.jinja +0 -89
  22. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-1000/optimizer.pt +0 -3
  23. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-1000/rng_state.pth +0 -3
  24. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-1000/scheduler.pt +0 -3
  25. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-1000/tokenizer.json +0 -3
  26. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-1000/tokenizer_config.json +0 -29
  27. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-1000/trainer_state.json +0 -553
  28. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-1000/training_args.bin +0 -3
  29. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-900/README.md +0 -209
  30. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-900/adapter_config.json +0 -46
  31. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-900/adapter_model.safetensors +0 -3
  32. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-900/chat_template.jinja +0 -89
  33. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-900/optimizer.pt +0 -3
  34. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-900/rng_state.pth +0 -3
  35. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-900/scheduler.pt +0 -3
  36. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-900/tokenizer.json +0 -3
  37. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-900/tokenizer_config.json +0 -29
  38. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-900/trainer_state.json +0 -502
  39. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-900/training_args.bin +0 -3
  40. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/hf_dataset_dict/dataset_dict.json +0 -1
  41. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/hf_dataset_dict/test/data-00000-of-00001.arrow +0 -3
  42. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/hf_dataset_dict/test/dataset_info.json +0 -89
  43. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/hf_dataset_dict/test/state.json +0 -13
  44. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/hf_dataset_dict/train/data-00000-of-00001.arrow +0 -3
  45. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/hf_dataset_dict/train/dataset_info.json +0 -89
  46. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/hf_dataset_dict/train/state.json +0 -13
  47. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/hf_dataset_dict/validation/data-00000-of-00001.arrow +0 -3
  48. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/hf_dataset_dict/validation/dataset_info.json +0 -89
  49. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/hf_dataset_dict/validation/state.json +0 -13
  50. UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/train_metrics.json +0 -7
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/.DS_Store DELETED
Binary file (8.2 kB)
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/dataset_split_summary.json DELETED
@@ -1,14 +0,0 @@
1
- {
2
- "dataset_path": "/scr/user/kevin2002/TensorCat/NLP/UM_Handbook/Dataset/SFT_Dataset/SFT_QA_Training_Ready.jsonl",
3
- "metadata_path": "/scr/user/kevin2002/TensorCat/NLP/UM_Handbook/Dataset/SFT_Dataset/SFT_QA_Metadata.jsonl",
4
- "rag_kb_path": "/scr/user/kevin2002/TensorCat/NLP/UM_Handbook/Dataset/RAG/UM_RAG_Knowledge_Base.jsonl",
5
- "rag_augmented_dataset_path": "/scr/user/kevin2002/TensorCat/NLP/UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/rag_augmented_dataset/rag_augmented_sft_dataset.jsonl",
6
- "total_examples": 1000,
7
- "train_examples": 800,
8
- "validation_examples": 100,
9
- "test_examples": 100,
10
- "seed": 42,
11
- "train_ratio": 0.8,
12
- "validation_ratio": 0.1,
13
- "test_ratio": 0.1
14
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/generation_eval/generation_details.jsonl DELETED
@@ -1,20 +0,0 @@
1
- {"qa_id": "qa_000031", "index_id": "UMI-0031", "query": "What are the programme goals, objectives, or learning outcomes for Master in Data Science?", "gold_answer": "The programme objectives describe data scientists who can extract meaningful insights, deliver effective data science solutions, sustain lifelong learning with an entrepreneurial mindset, and lead or contribute responsibly in public or private organisations. The learning outcomes highlight mastery of important data science concepts, recommending innovative data science and scientific computing solutions, constructing efficient data science tools, communicating with stakeholders, publishing and presenting solutions, using digital and analytic skills to acquire and interpret knowledge, leadership, lifelong learning, entrepreneurship, and professional ethics.", "plain_answer": "<think>\n\nSource document: General Handbook Format\n\nScope: postgraduate\n\nSection: Postgraduate Faculty Identity\n\nSubsection: Programme Education Objectives and Learning Outcomes\n\nKnowledge group: KG-0019\n\nChunk id: SC-0021\n\nEvidence:\nPROGRAMME EDUCATION OBJECTIVES AND LEARNING OUTCOMES PROGRAMME EDUCATION OBJECTIVES (PEO) Entry Level PEO1 Graduates are equipped with a wider breadth of knowledge in data science and deeper intelligence to solve problems by extracting and acquiring knowledge from data. PEO2 Graduates demonstrate leadership qualities with an entrepreneurial mindset in executing projects related to data", "rag_answer": "<think>\n\n</think>\n\nThe programme objectives describe data scientists who can extract meaningful insights for organisations, deliver effective data science solutions for stakeholders, engage in lifelong learning with an entrepreneurial mindset, and lead or contribute responsibly in public or private organisations. The learning outcomes highlight mastery of important data science concepts, recommending innovative data science and scientific computing solutions, constructing efficient data science tools, communicating with diverse audiences, publishing and presenting solutions in academic or industrial platforms, using digital skills to acquire and interpret knowledge, and demonstrating leadership, teamwork, and lifelong learning capabilities.", "plain_exact_match": 0.0, "plain_token_f1": 0.2857, "rag_exact_match": 0.0, "rag_token_f1": 0.8721, "retrieved_kb_ids": ["RAGKB-0427", "RAGKB-0428", "RAGKB-0429"], "retrieved_sections": ["Master in Data Science", "Master in Data Science", "Master in Data Science"], "retrieved_scopes": ["postgraduate", "postgraduate", "postgraduate"]}
2
- {"qa_id": "qa_000883", "index_id": "UMI-0883", "query": "Ngl, what distinctive specialization focus is highlighted for Bachelor of Computer Science (Information Systems)?", "gold_answer": "The distinctive specialization focus is Information Systems, with deeper emphasis on Information Systems techniques for analysing information, designing solutions, and developing computer-based systems.", "plain_answer": "<think>\n\n[]){\n</think>\n\nThe distinctive specialization focus highlighted for Bachelor of Computer Science (Information Systems) is information systems.", "rag_answer": "<think>\n\n</think>\n\nThe distinctive specialization focus is Information Systems, with deeper emphasis on Information Systems techniques for analysing information, designing information systems, and developing computer-based solutions.", "plain_exact_match": 0.0, "plain_token_f1": 0.5366, "rag_exact_match": 0.0, "rag_token_f1": 0.9412, "retrieved_kb_ids": ["RAGKB-0336", "RAGKB-0338", "RAGKB-0341"], "retrieved_sections": ["Undergraduate Programme Goals and Learning Outcomes", "Undergraduate Programme Goals and Learning Outcomes", "Undergraduate Programme Goals and Learning Outcomes"], "retrieved_scopes": ["undergraduate", "undergraduate", "undergraduate"]}
3
- {"qa_id": "qa_000387", "index_id": "UMI-0387", "query": "What policy links, regulations, or university rule documents are referenced for undergraduate students?", "gold_answer": "The undergraduate rules section refers students to the University of Malaya Bachelor's Degree rules and regulations, together with related university policy and administrative references.", "plain_answer": "<think>\n\nAh, the handbook evidence retrieved for this query shows that the undergraduate rules referenced include the Universiti Malaya (Undergraduate Rules) 2021/2024, the Universiti Malaya (Discipline of Students) Rules 1999, the Universiti Malaya (Examination) Rules 2025, the Universiti Malaya (Minimum Grade Requirement in Foundation/Vocation Modules) 2012, and the Universiti Malaya (Student Misconduct) Rules 2018. The linked policies include the Bachelor Degree Bachelor of Computer Science programme rules, the", "rag_answer": "<think>\n\n</think>\n\nThe undergraduate rules section refers students to the University of Malaya Bachelor's Degree rules and regulations, together with related university policy and administrative references.", "plain_exact_match": 0.0, "plain_token_f1": 0.2316, "rag_exact_match": 0.0, "rag_token_f1": 0.9615, "retrieved_kb_ids": ["RAGKB-0320", "RAGKB-0142", "RAGKB-0049"], "retrieved_sections": ["Undergraduate Rules and Regulations", "Undergraduate Faculty Identity", "Postgraduate General Information"], "retrieved_scopes": ["undergraduate", "undergraduate", "postgraduate"]}
4
- {"qa_id": "qa_000254", "index_id": "UMI-0254", "query": "What major milestones appear in the Graduate on Time schedule for Master of Computer Science (By Research)?", "gold_answer": "The Graduate on Time schedule for Master of Computer Science (By Research) lays out the expected semester-by-semester milestones for timely completion, including candidature progression, research-related stages, and expected outputs where applicable.", "plain_answer": "<think>\n\nSource document: Complete Handbook Semester 1 2025/2026 Knowledge Engineering and Medical Computing Lead by Dr. Wai Yan Chan Assistant Lead by Dr. Hoo Wai Lam : Assistant Prof. Dr. Amirrudin M. Noor Pathology of Medicine and Medical Imaging Medical Representation and Knowledge Engineering : Natural Language Processing Knowledge Engineering Security and Quantum Computing : Quantum Computing Foundation Quantum Key Distribution Machine Learning and Artificial Intelligence Linking Data and Semantics Metadata and Information Management : Big Data Analytics Business Analytics and Data Science : Big Data Applications Business Analytics and Data Science Social Media Data Analytics : Social Network Analysis and", "rag_answer": "<think>\n\n</think>\n\nThe Graduate on Time schedule for Master of Computer Science (By Research) maps the expected semester-by-semester milestones, including coursework completion, research proposal development and defence, ethics approval where applicable, dissertation stages, and the expected submission timeline for related academic outputs.", "plain_exact_match": 0.0, "plain_token_f1": 0.0923, "rag_exact_match": 0.0, "rag_token_f1": 0.7436, "retrieved_kb_ids": ["RAGKB-0509", "RAGKB-0510", "RAGKB-0374"], "retrieved_sections": ["Master of Computer Science (By Research)", "Master of Computer Science (By Research)", "Master of Computer Science (Applied Computing)"], "retrieved_scopes": ["postgraduate", "postgraduate", "postgraduate"]}
5
- {"qa_id": "qa_000129", "index_id": "UMI-0129", "query": "When was the Faculty of Computer Science and Information Technology officially formed?", "gold_answer": "The Universiti Malaya Council agreed to the formation of FCSIT on 22 September 1994.", "plain_answer": "<think>\n\n[Retrieved Evidence 1]\nSource document: General Handbook\nScope: general\nSection: History\nSubsection: History Overview\nKeywords: history overview, fcsit, computer technology, 1967, 1967 - 1993, 1993 - 2000, 2000 - 2010, 2010 - 2019, 2019 - 2025\nPages: 106\nChunk id: SC-00355\nText:\nHistory", "rag_answer": "<think>\n\n</think>\n\nThe faculty was officially formed in 1994 through the Universities and University Colleges Act.", "plain_exact_match": 0.0, "plain_token_f1": 0.037, "rag_exact_match": 0.0, "rag_token_f1": 0.2, "retrieved_kb_ids": ["RAGKB-0003", "RAGKB-0004", "RAGKB-0002"], "retrieved_sections": ["History of the Faculty", "History of the Faculty", "History of the Faculty"], "retrieved_scopes": ["general", "general", "general"]}
6
- {"qa_id": "qa_000308", "index_id": "UMI-0308", "query": "What distinctive specialization focus is highlighted for Bachelor of Computer Science (Artificial Intelligence)?", "gold_answer": "The specialization focus highlighted for Bachelor of Computer Science (Artificial Intelligence) is artificial intelligence, as reflected by the programme title and its learning-outcome emphasis.", "plain_answer": "<think>\n\n[Retrieved Evidence 1]\nThe Bachelor of Computer Science (Artificial Intelligence) programme will produce graduates who are able to demonstrate graduate attributes such as: 1. Update knowledge on the latest computer science and Artificial Intelligence techniques and tools to address current problems by constantly learning new concepts and practices, especially those related to algorithmic development, system analysis and design, and data ...[truncated]\n\n[Retrieved Evidence 2]\nPROGRAMME EDUCATIONAL OBJECTIVE (PEO) 1. Graduates engaged in careers related to the computing industry and involved in activities including but not limited to software development, system analysis and design,", "rag_answer": "<think>\n\n</think>\n\nThe specialization focus highlighted for Bachelor of Computer Science (Artificial Intelligence) is artificial intelligence, as reflected by the programme title and its learning-outcome emphasis.", "plain_exact_match": 0.0, "plain_token_f1": 0.2521, "rag_exact_match": 0.0, "rag_token_f1": 0.9615, "retrieved_kb_ids": ["RAGKB-0328", "RAGKB-0330", "RAGKB-0333"], "retrieved_sections": ["Undergraduate Programme Goals and Learning Outcomes", "Undergraduate Programme Goals and Learning Outcomes", "Undergraduate Programme Goals and Learning Outcomes"], "retrieved_scopes": ["undergraduate", "undergraduate", "undergraduate"]}
7
- {"qa_id": "qa_000641", "index_id": "UMI-0641", "query": "Could you list the main lecture periods for bachelor degree students in Semester II of session 2025/2026?", "gold_answer": "For bachelor degree students in Semester II, the main lecture periods are 09.03.2026 to 26.04.2026 and 04.05.2026 to 21.06.2026.", "plain_answer": "<think>\n\nOkay, the user is asking about the main lecture periods for Bachelor's students in Semester II of the 2025/2026 session. Let me check the handbook.\n\n[Looks at retrieved evidence]\n\nThe handbook states that for Semester II, the main lecture periods are Week 5 to Week 17, with a two-week break in the middle. It also mentions that the start and end weeks might vary slightly depending on public and festive holidays. \n\nSo the answer should mention the main lecture period as Week 5 to Week 17, note the two-week break, and indicate that the exact weeks", "rag_answer": "<think>\n\n</think>\n\nThe main lecture periods for Bachelor Degree Level in Semester II are shown in a calendar structure. They include revision time, revision week, examination time, and the stated break periods.", "plain_exact_match": 0.0, "plain_token_f1": 0.2344, "rag_exact_match": 0.0, "rag_token_f1": 0.4068, "retrieved_kb_ids": ["RAGKB-0008", "RAGKB-0009", "RAGKB-0006"], "retrieved_sections": ["Academic Calendar 2025/2026", "Academic Calendar 2025/2026", "Academic Calendar 2025/2026"], "retrieved_scopes": ["undergraduate", "undergraduate", "postgraduate"]}
8
- {"qa_id": "qa_000799", "index_id": "UMI-0799", "query": "Quick one: what graduate or research capabilities are highlighted in the learning objectives and outcomes for Master of Computer Science (By Research)?", "gold_answer": "The learning objectives and outcomes highlight the ability to apply and integrate knowledge of current computer science research issues, evaluate and analyse computing solutions, develop and assess research outcomes, use appropriate research methods to acquire and extend knowledge, communicate and publish technical work effectively, work independently and in groups, and demonstrate ethical and professionally responsible research conduct.", "plain_answer": "<think>\n\nOkay, let me check the handbook for the learning objectives and outcomes of Master of Computer Science (By Research). The user is asking which graduate or research capabilities are highlighted there.\n\n[Searches the handbook]\n\nThe handbook states that upon completion of the programme, graduates can:\r\n\r\n1. Demonstrate a deeper understanding of the principles, concepts, and theories in computer science. \r\n2. Exhibit the ability to integrate knowledge and skills in conducting independent research in the selected computer science area. \r\n3. Display strong character attributes such as perseverance, responsibility, and the ability to work independently. \r\n\r\nThe programme learning objectives also emphasise advancing knowledge", "rag_answer": "<think>\n\n</think>\n\nThe learning objectives and outcomes highlight the ability to apply and integrate knowledge of current computer science research issues, evaluate and analyse computing solutions, develop and assess research outcomes, use appropriate research methods to acquire and extend knowledge, communicate and publish technical work effectively, work independently and in groups, and demonstrate ethical and professionally responsible research behaviour.", "plain_exact_match": 0.0, "plain_token_f1": 0.3145, "rag_exact_match": 0.0, "rag_token_f1": 0.9655, "retrieved_kb_ids": ["RAGKB-0504", "RAGKB-0505", "RAGKB-0506"], "retrieved_sections": ["Master of Computer Science (By Research)", "Master of Computer Science (By Research)", "Master of Computer Science (By Research)"], "retrieved_scopes": ["postgraduate", "postgraduate", "postgraduate"]}
9
- {"qa_id": "qa_000986", "index_id": "UMI-0986", "query": "Could you tell me what dress expectations are illustrated for official events?", "gold_answer": "For official events, the poster illustrates formal attire, including suit-style clothing and traditional formal wear, to convey a neat and official appearance appropriate for formal university occasions.", "plain_answer": "<think>\n\nOkay, so the user is asking about the dress expectations for official events based on the retrieved handbook evidence. Let me look at the evidence provided.\n\nThe retrieved text is from the postgraduate dress code and covers pages 24 and 25. It starts by emphasizing that the handbook is a general guide and does not create any binding legal or contractual obligations. Then, under Dress Code in Official Events, it states that the attire should reflect good taste and be in line with the university's image. The expectations are illustrated as follows:\n\nFor men:\n- Formal events: a traditional Bahasa costume or formal business suit with a", "rag_answer": "<think>\n\n</think>\n\nThe poster illustrates formal or traditional formal attire for official university occasions.", "plain_exact_match": 0.0, "plain_token_f1": 0.2206, "rag_exact_match": 0.0, "rag_token_f1": 0.5238, "retrieved_kb_ids": ["RAGKB-0319", "RAGKB-0138", "RAGKB-0071"], "retrieved_sections": ["Student Dress Code", "Research Guidance", "Research Guidance"], "retrieved_scopes": ["general", "postgraduate", "postgraduate"]}
10
- {"qa_id": "qa_000566", "index_id": "UMI-0566", "query": "Could you tell me what schedule must students follow during industrial training?", "gold_answer": "A week-by-week schedule for students during Industrial Training, including placement approval, logbook submission, faculty supervision checkpoints, and final report submission.", "plain_answer": "<think>\n\nOkay, so the user is asking about the schedule students must follow during Industrial Training. Let me check the retrieved evidence.\n\nThe handbook says the Industrial Training Schedule includes eight weeks of training starting from the third or fourth semester, depending on the faculty. It mentions the week before the training starts as the Industrial Training Orientation and Workshop (ITOW), which has five main stages: Ice-Breaking and Health & Safety Talk, Company Placement, Technical Workshop 1, Industrial Training Week, and Technical Workshop 2. The eight weeks of training are divided into four weeks in the company and four weeks at the faculty, with specific weeks for log", "rag_answer": "<think>\n\n</think>\n\nStudents must follow the approved Industrial Training schedule, which includes the planned weeks of training, the required assessment and reporting periods, and the approved completion milestone.", "plain_exact_match": 0.0, "plain_token_f1": 0.1692, "rag_exact_match": 0.0, "rag_token_f1": 0.2, "retrieved_kb_ids": ["RAGKB-0285", "RAGKB-0287", "RAGKB-0289"], "retrieved_sections": ["Industrial Training", "Industrial Training", "Industrial Training"], "retrieved_scopes": ["undergraduate", "undergraduate", "undergraduate"]}
11
- {"qa_id": "qa_000994", "index_id": "UMI-0994", "query": "Quick check: what consequences or disciplinary actions are implied for examination dishonesty?", "gold_answer": "The consequences are disciplinary in nature. The handbook points students to official Universiti Malaya academic dishonesty, examination misconduct, and student discipline rules, which means dishonest conduct may trigger action under the university's disciplinary framework.", "plain_answer": "<think>\n\nOkay, so the user is asking about the consequences or disciplinary actions for examination dishonesty. Let me check the retrieved evidence first.\n\n[Retrieved Evidence 1]\nSource document: Complete Handbook\nScope: undergraduate\nSection: Examination Honesty and Discipline / Undergraduate Rules\nSubsection: Examination Honesty and Discipline\nPages: 111\nKnowledge group: KG-0061\nChunk id: SC-00321\nText:\nEXAMINATION HONESTY AND DISCIPLINE Link: https://umsitsmumum.um.edu.my The Universiti Malaya Senate Academic Press", "rag_answer": "<think>\n\n</think>\n\nThe consequences are disciplinary in nature. The handbook points students to official Universiti Malaya academic dishonesty, examination misconduct, and student discipline rules, which means dishonest conduct may trigger disciplinary action under the university's regulations.", "plain_exact_match": 0.0, "plain_token_f1": 0.2642, "rag_exact_match": 0.0, "rag_token_f1": 0.9444, "retrieved_kb_ids": ["RAGKB-0320", "RAGKB-0321", "RAGKB-0292"], "retrieved_sections": ["Undergraduate Rules and Regulations", "Examination Grading Scheme", "Industrial Training"], "retrieved_scopes": ["undergraduate", "undergraduate", "undergraduate"]}
12
- {"qa_id": "qa_000105", "index_id": "UMI-0105", "query": "What is the process flow for Academic Project II?", "gold_answer": "The handbook presents Academic Project as a staged process covering topic or title approval, supervision, progress monitoring, submission through the ilmiah system, viva or evaluation sessions, and final report completion across Academic Project I and Academic Project II.", "plain_answer": "<think>\n\nv\n\nThe process flow for Academic Project II includes the following steps: (1) Students undergo software requirements gathering and analysis, (2) Students develop a project proposal, (3) Students undergo software design and coding, (4) Students test the developed system, and (6) Students prepare for acceptance by running the project and conducting the final report presentation & viva session.", "rag_answer": "<think>\n\n</think>\n\nThe handbook presents Academic Project as a staged process covering topic or title approval, supervision, progress monitoring, submission through the ilmiah system, viva or evaluation sessions, and final report completion across Academic Project I and Academic Project II.", "plain_exact_match": 0.0, "plain_token_f1": 0.3125, "rag_exact_match": 0.0, "rag_token_f1": 0.9744, "retrieved_kb_ids": ["RAGKB-0301", "RAGKB-0296", "RAGKB-0297"], "retrieved_sections": ["Academic Project", "Academic Project", "Academic Project"], "retrieved_scopes": ["undergraduate", "undergraduate", "undergraduate"]}
13
- {"qa_id": "qa_000028", "index_id": "UMI-0028", "query": "What is the course plan for Master of Software Engineering (Software Technology)?", "gold_answer": "The course plan organises the programme across multiple semesters for each intake. The core set includes Research Methodology, Architecting Software Systems, Framework-Based Software Design and Development, Software Verification and Validation, Software Project Management, and Dissertation. Students then select two electives such as Big Data Processing, Requirements Engineering, User Experience Design Studio, Advanced Internet of Things, Advanced Machine Learning, or Security Risk Analysis and Evaluation. The handbook notes that Research Methodology must be taken in the first semester, and dissertation registration requires at least 6 credits of passed coursework together with having taken or being enrolled in Research Methodology.", "plain_answer": "<think>\n\n<source_documents>\n<document>\n <section>\n <pages>\n <page one_page_id=\"int-00001\">\n <orig_source_document_id>SO</orig_source_document_id>\n <section_title>POSTGRADUATE RULEBOOK</section_title>\n <subsection_title>Section III</subsection_title>\n <subsubsection_title>Minimum Grade Requirement for Programme Completion</subsubsubsection_title>\n <p>Students, including the supervisor, must attain a minimum grade of C for all coursework components. For research methodology course, students are required to pass the exam but there is no grade assigned.</p>\n </", "rag_answer": "<think>\n\n</think>\n\nThe course plan organises the programme across multiple semesters for each intake. The core set includes Research Methodology, Architecting Software Systems, Framework-Based Software Design and Development, Software Verification and Validation, Software Project Management, and Dissertation. Students then select two electives such as Big Data Processing, Requirements Engineering, User Experience Design Studio, Advanced Internet of Things, Advanced Machine Learning, or Security Risk Analysis and Evaluation. The handbook notes that Research Methodology must be taken in the first semester, and dissertation registration requires at least 6 credits of passed coursework together with having taken or being enrolled in Research Methodology.", "plain_exact_match": 0.0, "plain_token_f1": 0.125, "rag_exact_match": 0.0, "rag_token_f1": 0.99, "retrieved_kb_ids": ["RAGKB-0404", "RAGKB-0402", "RAGKB-0403"], "retrieved_sections": ["Master of Software Engineering (Software Technology)", "Master of Software Engineering (Software Technology)", "Master of Software Engineering (Software Technology)"], "retrieved_scopes": ["postgraduate", "postgraduate", "postgraduate"]}
14
- {"qa_id": "qa_000972", "index_id": "UMI-0972", "query": "Could you tell me what conditions or achievements make a project eligible for the Excellence Academic Project Award (APAC)?", "gold_answer": "The Excellence Academic Project Award (APAC), introduced in 2012, is an annual event that motivates students to produce excellent projects, recognizes strong systems, identifies good projects for reference and exhibition, and promotes them for competitions, exhibitions, and intellectual property purposes.", "plain_answer": "<think>\n\nOkay, let me check the handbook for the eligibility conditions of the Excellence Academic Project Award (APAC). The user wants to know what conditions or achievements make a project eligible for this award.\n\nLooking at the relevant section, it states that APAC is given to the best academic project in a department or unit, as decided by the Dean. The assessment criteria include the project theme (which must relate to the field of computer science and information technology), presentation skills, and the quality of the project development. \n\nSo, the key eligibility points are:\n1. The project must be among the best in its department or unit.\n2.", "rag_answer": "<think>\n\n</think>\n\nThe Excellence Academic Project Award (APAC), introduced in 2012, is an annual event to motivate students to produce excellent projects. It identifies strong projects for competitions, exhibitions, and intellectual property purposes and selects the best project from each department or unit within a given semester.", "plain_exact_match": 0.0, "plain_token_f1": 0.1892, "rag_exact_match": 0.0, "rag_token_f1": 0.6667, "retrieved_kb_ids": ["RAGKB-0308", "RAGKB-0297", "RAGKB-0296"], "retrieved_sections": ["Academic Project", "Academic Project", "Academic Project"], "retrieved_scopes": ["undergraduate", "undergraduate", "undergraduate"]}
15
- {"qa_id": "qa_000170", "index_id": "UMI-0170", "query": "What facilities and research focus are described for the Robotedge AI Robotic Lab?", "gold_answer": "The Robotedge AI Robotic Lab, previously known as the Natural Language Processing Lab, is equipped for AI robotics research and development, especially in environmental, home services, and search-and-rescue areas.", "plain_answer": "<think>\n\nOkay, let me check the handbook for information about the Robotedge AI Robotic Lab. The user wants to know the facilities and research focus described there.\n\n[Searches the retrieved handbook evidence]\n\nThe handbook states that the Robotedge AI Robotic Lab is equipped with six mobile robots and focuses on AI-based robotics research. Its key research areas include robotic perception, human–robot interaction, robotic manipulation, and AI-based autonomous navigation.\n\nSo, the answer should mention the six mobile robots as the main facility and list the four research areas. Make sure to keep it faithful to the handbook.", "rag_answer": "<think>\n\n</think>\n\nThe Robotedge AI Robotic Lab, previously known as the Natural Language Processing Lab, is equipped for AI robotics research and development, especially in environmental, home services, and search-and-rescue areas.", "plain_exact_match": 0.0, "plain_token_f1": 0.2769, "rag_exact_match": 0.0, "rag_token_f1": 0.9688, "retrieved_kb_ids": ["RAGKB-0017", "RAGKB-0019", "RAGKB-0016"], "retrieved_sections": ["Teaching and Learning Facilities", "Teaching and Learning Facilities", "Teaching and Learning Facilities"], "retrieved_scopes": ["general", "general", "general"]}
16
- {"qa_id": "qa_000914", "index_id": "UMI-0914", "query": "Could you explain how should students interpret or use the programme core courses list when planning their studies?", "gold_answer": "Students should use the programme core courses list as compulsory study-planning guidance: they are expected to pass all Faculty and Programme Core courses and to check the stated course prerequisites, with Industrial Training treated separately in the prerequisite note.", "plain_answer": "<think>\n\nOkay, so the user is asking how students should interpret or use the Programme Core Courses list when planning their studies. Let me check the retrieved evidence first.\n\nThe handbook says that the Programme Core Courses list includes courses compulsory for all postgraduate study plans and must be taken in the first semester. It also notes that students must check the current list provided by the department. \n\nHmm, the user probably wants to know if they should use that list as a mandatory checklist, when to take those courses, and maybe how it interacts with other course lists. The answer should clarify that the core courses are compulsory, must be taken in the first", "rag_answer": "<think>\n\n</think>\n\nStudents should use the programme core courses list as the required study component part of their study plan. They must complete all listed compulsory courses and use the course list together with the later handbook section for course sequencing and planning.", "plain_exact_match": 0.0, "plain_token_f1": 0.3613, "rag_exact_match": 0.0, "rag_token_f1": 0.506, "retrieved_kb_ids": ["RAGKB-0185", "RAGKB-0186", "RAGKB-0184"], "retrieved_sections": ["Shared Undergraduate Curriculum", "Shared Undergraduate Curriculum", "Shared Undergraduate Curriculum"], "retrieved_scopes": ["undergraduate", "undergraduate", "undergraduate"]}
17
- {"qa_id": "qa_000651", "index_id": "UMI-0651", "query": "Could you tell me what facilities and access arrangements are described for the Postgraduate Lab (ML)?", "gold_answer": "The Postgraduate Lab has 33 computer units connected to Windows Active Directory servers and the Internet, uses Windows 10, and is open to all FSKTM postgraduate students.", "plain_answer": "<think>\n\nOkay, let me check the handbook for the Postgraduate Lab (ML). The user is asking about the facilities and access arrangements listed there.\n\n[Retrieved Evidence 1]\nSource document: Complete Handbook\nScope: postgraduate\nSection: Laboratory Regulations and Support\nSubsection: Laboratory Regulations and Support\nPages: 303\nKnowledge group: KG-0085\nChunk id: SC-00304\nText:\n7. Users are not allowed to install any applications and data. 8. Users are prohibited from bringing in external data disks (e.g. ZX, CD, memory stick", "rag_answer": "<think>\n\n</think>\n\nThe Postgraduate Lab has 33 computer units connected to Windows Active Directory servers and the Internet, uses Windows 10, and is open to all FSKTM postgraduate students.", "plain_exact_match": 0.0, "plain_token_f1": 0.1667, "rag_exact_match": 0.0, "rag_token_f1": 0.9643, "retrieved_kb_ids": ["RAGKB-0010", "RAGKB-0012", "RAGKB-0011"], "retrieved_sections": ["Teaching and Learning Facilities", "Teaching and Learning Facilities", "Teaching and Learning Facilities"], "retrieved_scopes": ["general", "general", "general"]}
18
- {"qa_id": "qa_000292", "index_id": "UMI-0292", "query": "What rules apply to saving data, using personal devices, or protecting laboratory resources?", "gold_answer": "The laboratory regulations prohibit misuse of laboratory facilities, disruptive or improper behaviour, and conduct that may damage equipment, compromise safety, or interfere with other users.", "plain_answer": "<think>\n\nOkay, so the user is asking about rules related to saving data, using personal devices, and protecting lab resources. Let me check the handbook.\n\n[Retrieved Evidence 1]\nSource document: Complete Handbook\nScope: general\nSection: General Laboratory Regulations\nSubsection: Laboratory Regulations\nKeywords page: 211\nPages: 211\nChunk id: SC-00014\nText:\nREFERENCE: GENERAL LABORATORY REGULATIONS at: http://aasd.fsktm.um.edu.my LAMPED RESEARCH AND LABORATORY REGULATIONS https://nuruzzaman.we", "rag_answer": "<think>\n\n</think>\n\nThe laboratory regulations prohibit misuse of laboratory facilities, disruptive or improper behaviour, and conduct that may damage equipment, compromise safety, or interfere with other users.", "plain_exact_match": 0.0, "plain_token_f1": 0.1053, "rag_exact_match": 0.0, "rag_token_f1": 0.9615, "retrieved_kb_ids": ["RAGKB-0139", "RAGKB-0140", "RAGKB-0141"], "retrieved_sections": ["Laboratory Regulations and Support", "Laboratory Regulations and Support", "Laboratory Regulations and Support"], "retrieved_scopes": ["general", "general", "general"]}
19
- {"qa_id": "qa_000525", "index_id": "UMI-0525", "query": "Could you tell me what curriculum structure or course planning information is shown for Bachelor of Computer Science (Computer System and Network)?", "gold_answer": "The curriculum structure semester by semester, showing how university courses, faculty core courses, programme core courses, specialization electives, industrial training, and the academic project fit into the degree plan.", "plain_answer": "<think>\n\nOkay, let me check the retrieved document for the Bachelor of Computer Science (Computer System and Network) programme. The user is asking about the curriculum structure and course planning information.\n\nFirst, I'll look for a section that outlines the curriculum. The document mentions a curriculum structure divided into eight courses, including university courses, faculty core electives, programme core courses, and specialization electives. That gives a general framework.\n\nNext, course planning is usually presented by semester. The Bachelor of Computer Science curriculum has 80 credits of fixed credits, spread across four years. Semester 1 has three subjects: one compulsory university course (PP", "rag_answer": "<think>\n\n</think>\n\nThe curriculum structure semester by semester, showing how university courses, faculty core courses, programme core courses, specialization electives, industrial training, and the academic project fit into the degree plan.", "plain_exact_match": 0.0, "plain_token_f1": 0.303, "rag_exact_match": 0.0, "rag_token_f1": 0.9667, "retrieved_kb_ids": ["RAGKB-0324", "RAGKB-0322", "RAGKB-0325"], "retrieved_sections": ["Undergraduate Programme Goals and Learning Outcomes", "Undergraduate Programme Goals and Learning Outcomes", "Undergraduate Programme Goals and Learning Outcomes"], "retrieved_scopes": ["undergraduate", "undergraduate", "undergraduate"]}
20
- {"qa_id": "qa_000673", "index_id": "UMI-0673", "query": "Hey, what facilities and access arrangements are described for the Knowledge Engineering Lab?", "gold_answer": "The Knowledge Engineering Lab is an open-space concept lab at Wisma R&D that is accessible to all postgraduate students, regardless of field, with permission for access.", "plain_answer": "<think>\n\nOkay, let me check the retrieved evidence about the Knowledge Engineering Lab. The user is asking about its facilities and access arrangements.\n\nFirst, the handbook states that the lab is located on the 15th floor of Wisma R&D and has 30 units of computer equipment. It's equipped with tools for knowledge engineering tasks such as the Python programming language, TensorFlow, SPARQL endpoints, knowledge graph visualization, and tools for ontology merging, reasoning, and semantic annotation. The text also mentions that internet access is provided and that users must follow the lab rules, including registration, prohibition of bringing in outsiders, and accountability for", "rag_answer": "<think>\n\n</think>\n\nThe Knowledge Engineering Lab is an open-space concept lab at Wisma R&D that is accessible to all postgraduate students, regardless of field, with permission for access.", "plain_exact_match": 0.0, "plain_token_f1": 0.2273, "rag_exact_match": 0.0, "rag_token_f1": 0.9655, "retrieved_kb_ids": ["RAGKB-0016", "RAGKB-0017", "RAGKB-0015"], "retrieved_sections": ["Teaching and Learning Facilities", "Teaching and Learning Facilities", "Teaching and Learning Facilities"], "retrieved_scopes": ["general", "general", "general"]}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/generation_eval/generation_metrics.json DELETED
@@ -1,10 +0,0 @@
1
- {
2
- "generation_eval_size": 20,
3
- "top_k": 3,
4
- "plain_exact_match": 0.0,
5
- "plain_token_f1": 0.2353,
6
- "rag_exact_match": 0.0,
7
- "rag_token_f1": 0.7842,
8
- "rag_minus_plain_exact_match": 0.0,
9
- "rag_minus_plain_token_f1": 0.549
10
- }
 
 
 
 
 
 
 
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/lora_adapter/README.md DELETED
@@ -1,209 +0,0 @@
1
- ---
2
- base_model: /scr/user/kevin2002/TensorCat/NLP/UM_Handbook/models/Qwen3-8B
3
- library_name: peft
4
- pipeline_tag: text-generation
5
- tags:
6
- - base_model:adapter:/scr/user/kevin2002/TensorCat/NLP/UM_Handbook/models/Qwen3-8B
7
- - lora
8
- - sft
9
- - transformers
10
- - trl
11
- ---
12
-
13
- # Model Card for Model ID
14
-
15
- <!-- Provide a quick summary of what the model is/does. -->
16
-
17
-
18
-
19
- ## Model Details
20
-
21
- ### Model Description
22
-
23
- <!-- Provide a longer summary of what this model is. -->
24
-
25
-
26
-
27
- - **Developed by:** [More Information Needed]
28
- - **Funded by [optional]:** [More Information Needed]
29
- - **Shared by [optional]:** [More Information Needed]
30
- - **Model type:** [More Information Needed]
31
- - **Language(s) (NLP):** [More Information Needed]
32
- - **License:** [More Information Needed]
33
- - **Finetuned from model [optional]:** [More Information Needed]
34
-
35
- ### Model Sources [optional]
36
-
37
- <!-- Provide the basic links for the model. -->
38
-
39
- - **Repository:** [More Information Needed]
40
- - **Paper [optional]:** [More Information Needed]
41
- - **Demo [optional]:** [More Information Needed]
42
-
43
- ## Uses
44
-
45
- <!-- Address questions around how the model is intended to be used, including the foreseeable users of the model and those affected by the model. -->
46
-
47
- ### Direct Use
48
-
49
- <!-- This section is for the model use without fine-tuning or plugging into a larger ecosystem/app. -->
50
-
51
- [More Information Needed]
52
-
53
- ### Downstream Use [optional]
54
-
55
- <!-- This section is for the model use when fine-tuned for a task, or when plugged into a larger ecosystem/app -->
56
-
57
- [More Information Needed]
58
-
59
- ### Out-of-Scope Use
60
-
61
- <!-- This section addresses misuse, malicious use, and uses that the model will not work well for. -->
62
-
63
- [More Information Needed]
64
-
65
- ## Bias, Risks, and Limitations
66
-
67
- <!-- This section is meant to convey both technical and sociotechnical limitations. -->
68
-
69
- [More Information Needed]
70
-
71
- ### Recommendations
72
-
73
- <!-- This section is meant to convey recommendations with respect to the bias, risk, and technical limitations. -->
74
-
75
- Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
76
-
77
- ## How to Get Started with the Model
78
-
79
- Use the code below to get started with the model.
80
-
81
- [More Information Needed]
82
-
83
- ## Training Details
84
-
85
- ### Training Data
86
-
87
- <!-- This should link to a Dataset Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
88
-
89
- [More Information Needed]
90
-
91
- ### Training Procedure
92
-
93
- <!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
94
-
95
- #### Preprocessing [optional]
96
-
97
- [More Information Needed]
98
-
99
-
100
- #### Training Hyperparameters
101
-
102
- - **Training regime:** [More Information Needed] <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
103
-
104
- #### Speeds, Sizes, Times [optional]
105
-
106
- <!-- This section provides information about throughput, start/end time, checkpoint size if relevant, etc. -->
107
-
108
- [More Information Needed]
109
-
110
- ## Evaluation
111
-
112
- <!-- This section describes the evaluation protocols and provides the results. -->
113
-
114
- ### Testing Data, Factors & Metrics
115
-
116
- #### Testing Data
117
-
118
- <!-- This should link to a Dataset Card if possible. -->
119
-
120
- [More Information Needed]
121
-
122
- #### Factors
123
-
124
- <!-- These are the things the evaluation is disaggregating by, e.g., subpopulations or domains. -->
125
-
126
- [More Information Needed]
127
-
128
- #### Metrics
129
-
130
- <!-- These are the evaluation metrics being used, ideally with a description of why. -->
131
-
132
- [More Information Needed]
133
-
134
- ### Results
135
-
136
- [More Information Needed]
137
-
138
- #### Summary
139
-
140
-
141
-
142
- ## Model Examination [optional]
143
-
144
- <!-- Relevant interpretability work for the model goes here -->
145
-
146
- [More Information Needed]
147
-
148
- ## Environmental Impact
149
-
150
- <!-- Total emissions (in grams of CO2eq) and additional considerations, such as electricity usage, go here. Edit the suggested text below accordingly -->
151
-
152
- Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
153
-
154
- - **Hardware Type:** [More Information Needed]
155
- - **Hours used:** [More Information Needed]
156
- - **Cloud Provider:** [More Information Needed]
157
- - **Compute Region:** [More Information Needed]
158
- - **Carbon Emitted:** [More Information Needed]
159
-
160
- ## Technical Specifications [optional]
161
-
162
- ### Model Architecture and Objective
163
-
164
- [More Information Needed]
165
-
166
- ### Compute Infrastructure
167
-
168
- [More Information Needed]
169
-
170
- #### Hardware
171
-
172
- [More Information Needed]
173
-
174
- #### Software
175
-
176
- [More Information Needed]
177
-
178
- ## Citation [optional]
179
-
180
- <!-- If there is a paper or blog post introducing the model, the APA and Bibtex information for that should go in this section. -->
181
-
182
- **BibTeX:**
183
-
184
- [More Information Needed]
185
-
186
- **APA:**
187
-
188
- [More Information Needed]
189
-
190
- ## Glossary [optional]
191
-
192
- <!-- If relevant, include terms and calculations in this section that can help readers understand the model or model card. -->
193
-
194
- [More Information Needed]
195
-
196
- ## More Information [optional]
197
-
198
- [More Information Needed]
199
-
200
- ## Model Card Authors [optional]
201
-
202
- [More Information Needed]
203
-
204
- ## Model Card Contact
205
-
206
- [More Information Needed]
207
- ### Framework versions
208
-
209
- - PEFT 0.18.1
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/lora_adapter/adapter_config.json DELETED
@@ -1,46 +0,0 @@
1
- {
2
- "alora_invocation_tokens": null,
3
- "alpha_pattern": {},
4
- "arrow_config": null,
5
- "auto_mapping": null,
6
- "base_model_name_or_path": "/scr/user/kevin2002/TensorCat/NLP/UM_Handbook/models/Qwen3-8B",
7
- "bias": "none",
8
- "corda_config": null,
9
- "ensure_weight_tying": false,
10
- "eva_config": null,
11
- "exclude_modules": null,
12
- "fan_in_fan_out": false,
13
- "inference_mode": true,
14
- "init_lora_weights": true,
15
- "layer_replication": null,
16
- "layers_pattern": null,
17
- "layers_to_transform": null,
18
- "loftq_config": {},
19
- "lora_alpha": 16,
20
- "lora_bias": false,
21
- "lora_dropout": 0.05,
22
- "megatron_config": null,
23
- "megatron_core": "megatron.core",
24
- "modules_to_save": null,
25
- "peft_type": "LORA",
26
- "peft_version": "0.18.1",
27
- "qalora_group_size": 16,
28
- "r": 8,
29
- "rank_pattern": {},
30
- "revision": null,
31
- "target_modules": [
32
- "o_proj",
33
- "up_proj",
34
- "q_proj",
35
- "down_proj",
36
- "k_proj",
37
- "v_proj",
38
- "gate_proj"
39
- ],
40
- "target_parameters": null,
41
- "task_type": "CAUSAL_LM",
42
- "trainable_token_indices": null,
43
- "use_dora": false,
44
- "use_qalora": false,
45
- "use_rslora": false
46
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/lora_adapter/adapter_model.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:6833958e7d1e52733a02c8675c398188d65dd02aed1c0cd026a6235c32247d7d
3
- size 87360584
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/lora_adapter/chat_template.jinja DELETED
@@ -1,89 +0,0 @@
1
- {%- if tools %}
2
- {{- '<|im_start|>system\n' }}
3
- {%- if messages[0].role == 'system' %}
4
- {{- messages[0].content + '\n\n' }}
5
- {%- endif %}
6
- {{- "# Tools\n\nYou may call one or more functions to assist with the user query.\n\nYou are provided with function signatures within <tools></tools> XML tags:\n<tools>" }}
7
- {%- for tool in tools %}
8
- {{- "\n" }}
9
- {{- tool | tojson }}
10
- {%- endfor %}
11
- {{- "\n</tools>\n\nFor each function call, return a json object with function name and arguments within <tool_call></tool_call> XML tags:\n<tool_call>\n{\"name\": <function-name>, \"arguments\": <args-json-object>}\n</tool_call><|im_end|>\n" }}
12
- {%- else %}
13
- {%- if messages[0].role == 'system' %}
14
- {{- '<|im_start|>system\n' + messages[0].content + '<|im_end|>\n' }}
15
- {%- endif %}
16
- {%- endif %}
17
- {%- set ns = namespace(multi_step_tool=true, last_query_index=messages|length - 1) %}
18
- {%- for message in messages[::-1] %}
19
- {%- set index = (messages|length - 1) - loop.index0 %}
20
- {%- if ns.multi_step_tool and message.role == "user" and message.content is string and not(message.content.startswith('<tool_response>') and message.content.endswith('</tool_response>')) %}
21
- {%- set ns.multi_step_tool = false %}
22
- {%- set ns.last_query_index = index %}
23
- {%- endif %}
24
- {%- endfor %}
25
- {%- for message in messages %}
26
- {%- if message.content is string %}
27
- {%- set content = message.content %}
28
- {%- else %}
29
- {%- set content = '' %}
30
- {%- endif %}
31
- {%- if (message.role == "user") or (message.role == "system" and not loop.first) %}
32
- {{- '<|im_start|>' + message.role + '\n' + content + '<|im_end|>' + '\n' }}
33
- {%- elif message.role == "assistant" %}
34
- {%- set reasoning_content = '' %}
35
- {%- if message.reasoning_content is string %}
36
- {%- set reasoning_content = message.reasoning_content %}
37
- {%- else %}
38
- {%- if '</think>' in content %}
39
- {%- set reasoning_content = content.split('</think>')[0].rstrip('\n').split('<think>')[-1].lstrip('\n') %}
40
- {%- set content = content.split('</think>')[-1].lstrip('\n') %}
41
- {%- endif %}
42
- {%- endif %}
43
- {%- if loop.index0 > ns.last_query_index %}
44
- {%- if loop.last or (not loop.last and reasoning_content) %}
45
- {{- '<|im_start|>' + message.role + '\n<think>\n' + reasoning_content.strip('\n') + '\n</think>\n\n' + content.lstrip('\n') }}
46
- {%- else %}
47
- {{- '<|im_start|>' + message.role + '\n' + content }}
48
- {%- endif %}
49
- {%- else %}
50
- {{- '<|im_start|>' + message.role + '\n' + content }}
51
- {%- endif %}
52
- {%- if message.tool_calls %}
53
- {%- for tool_call in message.tool_calls %}
54
- {%- if (loop.first and content) or (not loop.first) %}
55
- {{- '\n' }}
56
- {%- endif %}
57
- {%- if tool_call.function %}
58
- {%- set tool_call = tool_call.function %}
59
- {%- endif %}
60
- {{- '<tool_call>\n{"name": "' }}
61
- {{- tool_call.name }}
62
- {{- '", "arguments": ' }}
63
- {%- if tool_call.arguments is string %}
64
- {{- tool_call.arguments }}
65
- {%- else %}
66
- {{- tool_call.arguments | tojson }}
67
- {%- endif %}
68
- {{- '}\n</tool_call>' }}
69
- {%- endfor %}
70
- {%- endif %}
71
- {{- '<|im_end|>\n' }}
72
- {%- elif message.role == "tool" %}
73
- {%- if loop.first or (messages[loop.index0 - 1].role != "tool") %}
74
- {{- '<|im_start|>user' }}
75
- {%- endif %}
76
- {{- '\n<tool_response>\n' }}
77
- {{- content }}
78
- {{- '\n</tool_response>' }}
79
- {%- if loop.last or (messages[loop.index0 + 1].role != "tool") %}
80
- {{- '<|im_end|>\n' }}
81
- {%- endif %}
82
- {%- endif %}
83
- {%- endfor %}
84
- {%- if add_generation_prompt %}
85
- {{- '<|im_start|>assistant\n' }}
86
- {%- if enable_thinking is defined and enable_thinking is false %}
87
- {{- '<think>\n\n</think>\n\n' }}
88
- {%- endif %}
89
- {%- endif %}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/lora_adapter/tokenizer.json DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:be75606093db2094d7cd20f3c2f385c212750648bd6ea4fb2bf507a6a4c55506
3
- size 11422650
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/lora_adapter/tokenizer_config.json DELETED
@@ -1,29 +0,0 @@
1
- {
2
- "add_prefix_space": false,
3
- "backend": "tokenizers",
4
- "bos_token": null,
5
- "clean_up_tokenization_spaces": false,
6
- "eos_token": "<|im_end|>",
7
- "errors": "replace",
8
- "extra_special_tokens": [
9
- "<|im_start|>",
10
- "<|im_end|>",
11
- "<|object_ref_start|>",
12
- "<|object_ref_end|>",
13
- "<|box_start|>",
14
- "<|box_end|>",
15
- "<|quad_start|>",
16
- "<|quad_end|>",
17
- "<|vision_start|>",
18
- "<|vision_end|>",
19
- "<|vision_pad|>",
20
- "<|image_pad|>",
21
- "<|video_pad|>"
22
- ],
23
- "is_local": true,
24
- "model_max_length": 131072,
25
- "pad_token": "<|endoftext|>",
26
- "split_special_tokens": false,
27
- "tokenizer_class": "Qwen2Tokenizer",
28
- "unk_token": null
29
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/lora_adapter/training_args.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:1e28aed9c09299882a0a85d4a5e7b5f033f6f0f96c839015b54f530ff1cc1760
3
- size 5368
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/rag_augmented_dataset/rag_augmented_sft_dataset.jsonl DELETED
The diff for this file is too large to render. See raw diff
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/rag_augmented_dataset/rag_augmented_sft_dataset_preview.json DELETED
@@ -1,212 +0,0 @@
1
- [
2
- {
3
- "qa_id": "qa_000001",
4
- "index_id": "UMI-0001",
5
- "question": "What are the faculty objectives?",
6
- "answer": "The faculty objectives are to sustain excellence in undergraduate and postgraduate teaching, learning, and research; contribute to national development through quality research and publications; provide innovative academic programmes that respond to societal needs; and produce quality graduates with advanced knowledge and skills in computer science and information technology.",
7
- "scope_label": "general",
8
- "source_doc": "General Handbook",
9
- "section": "Faculty Objectives",
10
- "subsection": "Faculty Objectives",
11
- "retrieved_kb_ids": [
12
- "RAGKB-0001",
13
- "RAGKB-0515",
14
- "RAGKB-0504"
15
- ],
16
- "retrieved_sections": [
17
- "Faculty Objectives",
18
- "Doctor of Philosophy",
19
- "Master of Computer Science (By Research)"
20
- ],
21
- "retrieved_scopes": [
22
- "general",
23
- "postgraduate",
24
- "postgraduate"
25
- ],
26
- "prompt": [
27
- {
28
- "role": "system",
29
- "content": "You are an academic assistant for the Faculty of Computer Science and Information Technology, Universiti Malaya. Answer only with handbook-grounded information. Use the retrieved handbook evidence when it is provided. Keep the answer direct, specific, and faithful to the handbook. If the evidence does not support a claim, say so clearly and briefly."
30
- },
31
- {
32
- "role": "user",
33
- "content": "Use the retrieved handbook evidence to answer the question. Base the answer on the evidence and keep it faithful to the handbook.\n\n[Retrieved Evidence 1]\nSource document: General Handbook\nScope: general\nSection: Faculty Objectives\nSubsection: Faculty Objectives\nPages: 9\nKnowledge group: KG-0009\nChunk id: SC-00001\nText:\nVISION A global faculty impacting the world MISSION Propelling computing technology and producing world class leaders OBJECTIVES To sustain an outstanding faculty dedicated to excellence in undergraduate and postgraduate teaching, learning and research. To contribute towards the development of the nation through the production of quality research and publications. To provide innovative academic programs that can respond to the changing needs of the society. To produce quality graduates who are equipped with advanced knowledge and skills of computer science and information technology.\n\n[Retrieved Evidence 2]\nSource document: Complete Handbook\nScope: postgraduate\nSection: Doctor of Philosophy\nSubsection: Programme Education Objectives\nPages: 121\nKnowledge group: KG-0021\nChunk id: SC-00515\nText:\nPROGRAMME EDUCATION OBJETIVES oe PEO 1: Foster innovation of new ideas, methods and techniques in relevant research fields PEO 2: Lead research and establish a career as a skilled researcher and/or practitioner PEO 3. Disseminate research output and provide expert advice through various mechanisms in an ethical and professional manner\n\n[Retrieved Evidence 3]\nSource document: Complete Handbook\nScope: postgraduate\nSection: Master of Computer Science (By Research)\nSubsection: Learning Objectives and Outcomes\nPages: 114\nKnowledge group: KG-0039\nChunk id: SC-00504\nText:\nPROGRAMME LEARNING OBJECTIVES & OUTCOMES SS PROGRAMME EDUCATIONAL OBJECTIVES (PEO) 4. To produce researchers who can contribute to the development and knowledge of computer science 2. To produce professionals in computer science research 3. To equip graduates with technical and soft skills PROGRAMME LEARNING OUTCOMES (PLO) Taxonomic No. Programme Learning Outcomes PLOs Gubecte 1. [Apply and integrate knowledge on the latest research issues |p) Gy 3S in computer science and produce state-of-the-art research. 2. [Evaluate and analyse computing solutions in terms of re Pp usability, efficiency and effectiveness 3. [Produce computing solutions and use appropriate tools to lanalyse the performanc ...[truncated]\n\nQuestion: What are the faculty objectives?"
34
- }
35
- ],
36
- "completion": [
37
- {
38
- "role": "assistant",
39
- "content": "The faculty objectives are to sustain excellence in undergraduate and postgraduate teaching, learning, and research; contribute to national development through quality research and publications; provide innovative academic programmes that respond to societal needs; and produce quality graduates with advanced knowledge and skills in computer science and information technology."
40
- }
41
- ],
42
- "text": "<|im_start|>system\nYou are an academic assistant for the Faculty of Computer Science and Information Technology, Universiti Malaya. Answer only with handbook-grounded information. Use the retrieved handbook evidence when it is provided. Keep the answer direct, specific, and faithful to the handbook. If the evidence does not support a claim, say so clearly and briefly.<|im_end|>\n<|im_start|>user\nUse the retrieved handbook evidence to answer the question. Base the answer on the evidence and keep it faithful to the handbook.\n\n[Retrieved Evidence 1]\nSource document: General Handbook\nScope: general\nSection: Faculty Objectives\nSubsection: Faculty Objectives\nPages: 9\nKnowledge group: KG-0009\nChunk id: SC-00001\nText:\nVISION A global faculty impacting the world MISSION Propelling computing technology and producing world class leaders OBJECTIVES To sustain an outstanding faculty dedicated to excellence in undergraduate and postgraduate teaching, learning and research. To contribute towards the development of the nation through the production of quality research and publications. To provide innovative academic programs that can respond to the changing needs of the society. To produce quality graduates who are equipped with advanced knowledge and skills of computer science and information technology.\n\n[Retrieved Evidence 2]\nSource document: Complete Handbook\nScope: postgraduate\nSection: Doctor of Philosophy\nSubsection: Programme Education Objectives\nPages: 121\nKnowledge group: KG-0021\nChunk id: SC-00515\nText:\nPROGRAMME EDUCATION OBJETIVES oe PEO 1: Foster innovation of new ideas, methods and techniques in relevant research fields PEO 2: Lead research and establish a career as a skilled researcher and/or practitioner PEO 3. Disseminate research output and provide expert advice through various mechanisms in an ethical and professional manner\n\n[Retrieved Evidence 3]\nSource document: Complete Handbook\nScope: postgraduate\nSection: Master of Computer Science (By Research)\nSubsection: Learning Objectives and Outcomes\nPages: 114\nKnowledge group: KG-0039\nChunk id: SC-00504\nText:\nPROGRAMME LEARNING OBJECTIVES & OUTCOMES SS PROGRAMME EDUCATIONAL OBJECTIVES (PEO) 4. To produce researchers who can contribute to the development and knowledge of computer science 2. To produce professionals in computer science research 3. To equip graduates with technical and soft skills PROGRAMME LEARNING OUTCOMES (PLO) Taxonomic No. Programme Learning Outcomes PLOs Gubecte 1. [Apply and integrate knowledge on the latest research issues |p) Gy 3S in computer science and produce state-of-the-art research. 2. [Evaluate and analyse computing solutions in terms of re Pp usability, efficiency and effectiveness 3. [Produce computing solutions and use appropriate tools to lanalyse the performanc ...[truncated]\n\nQuestion: What are the faculty objectives?<|im_end|>\n<|im_start|>assistant\n<think>\n\n</think>\n\nThe faculty objectives are to sustain excellence in undergraduate and postgraduate teaching, learning, and research; contribute to national development through quality research and publications; provide innovative academic programmes that respond to societal needs; and produce quality graduates with advanced knowledge and skills in computer science and information technology.<|im_end|>\n"
43
- },
44
- {
45
- "qa_id": "qa_000002",
46
- "index_id": "UMI-0002",
47
- "question": "What is the history overview of the Faculty of Computer Science and Information Technology?",
48
- "answer": "Universiti Malaya's computing facilities began with the Computer Centre in the 1960s, later expanded into teaching and research, introduced the Diploma in Computer Science in 1974 and research degrees in 1985, then moved toward a full faculty structure in 1993. FCSIT was formally approved in 1994, its main building was opened in 1996, the Bachelor of Information Technology began in 1996/97, and four departments were established in 1997.",
49
- "scope_label": "general",
50
- "source_doc": "General Handbook",
51
- "section": "History of the Faculty",
52
- "subsection": "History Overview",
53
- "retrieved_kb_ids": [
54
- "RAGKB-0004",
55
- "RAGKB-0003",
56
- "RAGKB-0002"
57
- ],
58
- "retrieved_sections": [
59
- "History of the Faculty",
60
- "History of the Faculty",
61
- "History of the Faculty"
62
- ],
63
- "retrieved_scopes": [
64
- "general",
65
- "general",
66
- "general"
67
- ],
68
- "prompt": [
69
- {
70
- "role": "system",
71
- "content": "You are an academic assistant for the Faculty of Computer Science and Information Technology, Universiti Malaya. Answer only with handbook-grounded information. Use the retrieved handbook evidence when it is provided. Keep the answer direct, specific, and faithful to the handbook. If the evidence does not support a claim, say so clearly and briefly."
72
- },
73
- {
74
- "role": "user",
75
- "content": "Use the retrieved handbook evidence to answer the question. Base the answer on the evidence and keep it faithful to the handbook.\n\n[Retrieved Evidence 1]\nSource document: General Handbook\nScope: general\nSection: History of the Faculty\nSubsection: History Overview\nPages: 11\nKnowledge group: KG-0011\nChunk id: SC-00004\nText:\nThe Bachelor of Information Technology programme started in the 1996/1997 Session, with an initial intake of 50 students. To accommodate an increase student population, an additional building was built which was officially opened by Datuk Fong Chan Onn, Deputy Minister of Education on September 21st, 1998. Since its establishment, the Faculty of Computer Science and Information Technology have been led by a number of distinguished persons. The following have served as Directors/Dean: HISTORY OF THE FACULTY 1967 – 1973 1973 – 1975 1975 – 1978 1978 – 1982 1982 – 1990 1990 – 1992 1992 – 2000 2000 – 2002 2002 – 2004 2004 – 2005 2005 – 2006 2006 – 2007 2007 – 2009 2009 – 2010 2010 – 2011 2011 – 2 ...[truncated]\n\n[Retrieved Evidence 2]\nSource document: General Handbook\nScope: general\nSection: History of the Faculty\nSubsection: History Overview\nPages: 10\nKnowledge group: KG-0011\nChunk id: SC-00003\nText:\nprogramme. The first undergraduate enrolment for the 1990/1991 Session was 50 students. In April 1st, 1993, the University Senate agreed to the formation of the Computer Centre Study Board. The Board proposed the establishment of a faculty to be called the Faculty of Computer Science and Information Technology (FCSIT). The existing Computer Centre was to be annulled and replaced by a Computer Services Division which was placed under the Chancellery. On September 22nd, 1994, the University of Malaya Council agreed to the formation of the Faculty of Computer Science and Information Technology (FCSIT), and the Computer Services Division. A sum of 4.2 million was obtained from the Ministry of Ed ...[truncated]\n\n[Retrieved Evidence 3]\nSource document: General Handbook\nScope: general\nSection: History of the Faculty\nSubsection: History Overview\nPages: 10\nKnowledge group: KG-0011\nChunk id: SC-00002\nText:\nThe provision of computer facilities and services at the Universiti Malaya (UM) began soon after the Computer Centre was officially formed in 1965. This made the university one of the pioneers in computer usage in Malaysia. In December 1969, the Computer Centre took on an additional role of teaching and research of computer science and information technology. The Computer Centre Board was formed, comprising the Vice-Chancellor (as Chairman), the Director of Computer Centre (as Secretary), and a representative from each Faculty, Institute, Centre and the University Senate. In 1974, the Diploma in Computer Science programme was introduced. From its inception in the 1974/1975 Session to the 199 ...[truncated]\n\nQuestion: What is the history overview of the Faculty of Computer Science and Information Technology?"
76
- }
77
- ],
78
- "completion": [
79
- {
80
- "role": "assistant",
81
- "content": "Universiti Malaya's computing facilities began with the Computer Centre in the 1960s, later expanded into teaching and research, introduced the Diploma in Computer Science in 1974 and research degrees in 1985, then moved toward a full faculty structure in 1993. FCSIT was formally approved in 1994, its main building was opened in 1996, the Bachelor of Information Technology began in 1996/97, and four departments were established in 1997."
82
- }
83
- ],
84
- "text": "<|im_start|>system\nYou are an academic assistant for the Faculty of Computer Science and Information Technology, Universiti Malaya. Answer only with handbook-grounded information. Use the retrieved handbook evidence when it is provided. Keep the answer direct, specific, and faithful to the handbook. If the evidence does not support a claim, say so clearly and briefly.<|im_end|>\n<|im_start|>user\nUse the retrieved handbook evidence to answer the question. Base the answer on the evidence and keep it faithful to the handbook.\n\n[Retrieved Evidence 1]\nSource document: General Handbook\nScope: general\nSection: History of the Faculty\nSubsection: History Overview\nPages: 11\nKnowledge group: KG-0011\nChunk id: SC-00004\nText:\nThe Bachelor of Information Technology programme started in the 1996/1997 Session, with an initial intake of 50 students. To accommodate an increase student population, an additional building was built which was officially opened by Datuk Fong Chan Onn, Deputy Minister of Education on September 21st, 1998. Since its establishment, the Faculty of Computer Science and Information Technology have been led by a number of distinguished persons. The following have served as Directors/Dean: HISTORY OF THE FACULTY 1967 – 1973 1973 – 1975 1975 – 1978 1978 – 1982 1982 – 1990 1990 – 1992 1992 – 2000 2000 – 2002 2002 – 2004 2004 – 2005 2005 – 2006 2006 – 2007 2007 – 2009 2009 – 2010 2010 – 2011 2011 – 2 ...[truncated]\n\n[Retrieved Evidence 2]\nSource document: General Handbook\nScope: general\nSection: History of the Faculty\nSubsection: History Overview\nPages: 10\nKnowledge group: KG-0011\nChunk id: SC-00003\nText:\nprogramme. The first undergraduate enrolment for the 1990/1991 Session was 50 students. In April 1st, 1993, the University Senate agreed to the formation of the Computer Centre Study Board. The Board proposed the establishment of a faculty to be called the Faculty of Computer Science and Information Technology (FCSIT). The existing Computer Centre was to be annulled and replaced by a Computer Services Division which was placed under the Chancellery. On September 22nd, 1994, the University of Malaya Council agreed to the formation of the Faculty of Computer Science and Information Technology (FCSIT), and the Computer Services Division. A sum of 4.2 million was obtained from the Ministry of Ed ...[truncated]\n\n[Retrieved Evidence 3]\nSource document: General Handbook\nScope: general\nSection: History of the Faculty\nSubsection: History Overview\nPages: 10\nKnowledge group: KG-0011\nChunk id: SC-00002\nText:\nThe provision of computer facilities and services at the Universiti Malaya (UM) began soon after the Computer Centre was officially formed in 1965. This made the university one of the pioneers in computer usage in Malaysia. In December 1969, the Computer Centre took on an additional role of teaching and research of computer science and information technology. The Computer Centre Board was formed, comprising the Vice-Chancellor (as Chairman), the Director of Computer Centre (as Secretary), and a representative from each Faculty, Institute, Centre and the University Senate. In 1974, the Diploma in Computer Science programme was introduced. From its inception in the 1974/1975 Session to the 199 ...[truncated]\n\nQuestion: What is the history overview of the Faculty of Computer Science and Information Technology?<|im_end|>\n<|im_start|>assistant\n<think>\n\n</think>\n\nUniversiti Malaya's computing facilities began with the Computer Centre in the 1960s, later expanded into teaching and research, introduced the Diploma in Computer Science in 1974 and research degrees in 1985, then moved toward a full faculty structure in 1993. FCSIT was formally approved in 1994, its main building was opened in 1996, the Bachelor of Information Technology began in 1996/97, and four departments were established in 1997.<|im_end|>\n"
85
- },
86
- {
87
- "qa_id": "qa_000003",
88
- "index_id": "UMI-0003",
89
- "question": "What key milestones are mentioned in the faculty history?",
90
- "answer": "Key milestones include the formation of the Computer Centre, the start of teaching and research in 1969, the introduction of the Diploma in Computer Science in 1974, approval and administration of the Master of Computer Science and PhD research programmes in 1985, the 1993 proposal to establish FCSIT, formal approval in 1994, the opening of the faculty building in 1996, the start of the Bachelor of Information Technology in 1996/97, and the establishment of four departments in 1997.",
91
- "scope_label": "general",
92
- "source_doc": "General Handbook",
93
- "section": "History of the Faculty",
94
- "subsection": "History Overview",
95
- "retrieved_kb_ids": [
96
- "RAGKB-0002",
97
- "RAGKB-0003",
98
- "RAGKB-0005"
99
- ],
100
- "retrieved_sections": [
101
- "History of the Faculty",
102
- "History of the Faculty",
103
- "History of the Faculty"
104
- ],
105
- "retrieved_scopes": [
106
- "general",
107
- "general",
108
- "general"
109
- ],
110
- "prompt": [
111
- {
112
- "role": "system",
113
- "content": "You are an academic assistant for the Faculty of Computer Science and Information Technology, Universiti Malaya. Answer only with handbook-grounded information. Use the retrieved handbook evidence when it is provided. Keep the answer direct, specific, and faithful to the handbook. If the evidence does not support a claim, say so clearly and briefly."
114
- },
115
- {
116
- "role": "user",
117
- "content": "Use the retrieved handbook evidence to answer the question. Base the answer on the evidence and keep it faithful to the handbook.\n\n[Retrieved Evidence 1]\nSource document: General Handbook\nScope: general\nSection: History of the Faculty\nSubsection: History Overview\nPages: 10\nKnowledge group: KG-0011\nChunk id: SC-00002\nText:\nThe provision of computer facilities and services at the Universiti Malaya (UM) began soon after the Computer Centre was officially formed in 1965. This made the university one of the pioneers in computer usage in Malaysia. In December 1969, the Computer Centre took on an additional role of teaching and research of computer science and information technology. The Computer Centre Board was formed, comprising the Vice-Chancellor (as Chairman), the Director of Computer Centre (as Secretary), and a representative from each Faculty, Institute, Centre and the University Senate. In 1974, the Diploma in Computer Science programme was introduced. From its inception in the 1974/1975 Session to the 199 ...[truncated]\n\n[Retrieved Evidence 2]\nSource document: General Handbook\nScope: general\nSection: History of the Faculty\nSubsection: History Overview\nPages: 10\nKnowledge group: KG-0011\nChunk id: SC-00003\nText:\nprogramme. The first undergraduate enrolment for the 1990/1991 Session was 50 students. In April 1st, 1993, the University Senate agreed to the formation of the Computer Centre Study Board. The Board proposed the establishment of a faculty to be called the Faculty of Computer Science and Information Technology (FCSIT). The existing Computer Centre was to be annulled and replaced by a Computer Services Division which was placed under the Chancellery. On September 22nd, 1994, the University of Malaya Council agreed to the formation of the Faculty of Computer Science and Information Technology (FCSIT), and the Computer Services Division. A sum of 4.2 million was obtained from the Ministry of Ed ...[truncated]\n\n[Retrieved Evidence 3]\nSource document: General Handbook\nScope: general\nSection: History of the Faculty\nSubsection: History Overview\nPages: 11\nKnowledge group: KG-0011\nChunk id: SC-00005\nText:\nProfessor Dato' Dr. Ir. Mashkuri Hj. Yaacob Professor Dr. Mohd Sapiyan Baba Professor Dr. David Ngo Chek Ling Professor Dr. Wan Ahmad Tajuddin Wan Abdullah Professor Dr. Siti Salwah Salim Professor Dr. Abdullah Gani Professor Dr. Abrizah Abdullah Professor Datin Dr. Sameem Abdul Kareem Professor Dr. Loo Chu Kiong Professor Ir. Dr. Chan Chee Seng Associate Professor Dr. Norisma Idris\n\nQuestion: What key milestones are mentioned in the faculty history?"
118
- }
119
- ],
120
- "completion": [
121
- {
122
- "role": "assistant",
123
- "content": "Key milestones include the formation of the Computer Centre, the start of teaching and research in 1969, the introduction of the Diploma in Computer Science in 1974, approval and administration of the Master of Computer Science and PhD research programmes in 1985, the 1993 proposal to establish FCSIT, formal approval in 1994, the opening of the faculty building in 1996, the start of the Bachelor of Information Technology in 1996/97, and the establishment of four departments in 1997."
124
- }
125
- ],
126
- "text": "<|im_start|>system\nYou are an academic assistant for the Faculty of Computer Science and Information Technology, Universiti Malaya. Answer only with handbook-grounded information. Use the retrieved handbook evidence when it is provided. Keep the answer direct, specific, and faithful to the handbook. If the evidence does not support a claim, say so clearly and briefly.<|im_end|>\n<|im_start|>user\nUse the retrieved handbook evidence to answer the question. Base the answer on the evidence and keep it faithful to the handbook.\n\n[Retrieved Evidence 1]\nSource document: General Handbook\nScope: general\nSection: History of the Faculty\nSubsection: History Overview\nPages: 10\nKnowledge group: KG-0011\nChunk id: SC-00002\nText:\nThe provision of computer facilities and services at the Universiti Malaya (UM) began soon after the Computer Centre was officially formed in 1965. This made the university one of the pioneers in computer usage in Malaysia. In December 1969, the Computer Centre took on an additional role of teaching and research of computer science and information technology. The Computer Centre Board was formed, comprising the Vice-Chancellor (as Chairman), the Director of Computer Centre (as Secretary), and a representative from each Faculty, Institute, Centre and the University Senate. In 1974, the Diploma in Computer Science programme was introduced. From its inception in the 1974/1975 Session to the 199 ...[truncated]\n\n[Retrieved Evidence 2]\nSource document: General Handbook\nScope: general\nSection: History of the Faculty\nSubsection: History Overview\nPages: 10\nKnowledge group: KG-0011\nChunk id: SC-00003\nText:\nprogramme. The first undergraduate enrolment for the 1990/1991 Session was 50 students. In April 1st, 1993, the University Senate agreed to the formation of the Computer Centre Study Board. The Board proposed the establishment of a faculty to be called the Faculty of Computer Science and Information Technology (FCSIT). The existing Computer Centre was to be annulled and replaced by a Computer Services Division which was placed under the Chancellery. On September 22nd, 1994, the University of Malaya Council agreed to the formation of the Faculty of Computer Science and Information Technology (FCSIT), and the Computer Services Division. A sum of 4.2 million was obtained from the Ministry of Ed ...[truncated]\n\n[Retrieved Evidence 3]\nSource document: General Handbook\nScope: general\nSection: History of the Faculty\nSubsection: History Overview\nPages: 11\nKnowledge group: KG-0011\nChunk id: SC-00005\nText:\nProfessor Dato' Dr. Ir. Mashkuri Hj. Yaacob Professor Dr. Mohd Sapiyan Baba Professor Dr. David Ngo Chek Ling Professor Dr. Wan Ahmad Tajuddin Wan Abdullah Professor Dr. Siti Salwah Salim Professor Dr. Abdullah Gani Professor Dr. Abrizah Abdullah Professor Datin Dr. Sameem Abdul Kareem Professor Dr. Loo Chu Kiong Professor Ir. Dr. Chan Chee Seng Associate Professor Dr. Norisma Idris\n\nQuestion: What key milestones are mentioned in the faculty history?<|im_end|>\n<|im_start|>assistant\n<think>\n\n</think>\n\nKey milestones include the formation of the Computer Centre, the start of teaching and research in 1969, the introduction of the Diploma in Computer Science in 1974, approval and administration of the Master of Computer Science and PhD research programmes in 1985, the 1993 proposal to establish FCSIT, formal approval in 1994, the opening of the faculty building in 1996, the start of the Bachelor of Information Technology in 1996/97, and the establishment of four departments in 1997.<|im_end|>\n"
127
- },
128
- {
129
- "qa_id": "qa_000004",
130
- "index_id": "UMI-0004",
131
- "question": "What is the academic calendar for master and doctorate level in session 2025/2026?",
132
- "answer": "The 2025/2026 master and doctorate academic calendar with Semester I, Semester II, and a special semester, covering orientation, lecture periods, mid-semester breaks, revision weeks, final examinations, and semester breaks. Semester I: Orientation (WOW) 05.10.2025-12.10.2025; lectures 13.10.2025-23.11.2025 and 01.12.2025-25.01.2026; mid-semester break 24.11.2025-30.11.2025; revision week 26.01.2026-01.02.2026; final examination 02.02.2026-22.02.2026; semester break 23.02.2026-08.03.2026. Semester II: lectures 09.03.2026-26.04.2026 and 04.05.2026-21.06.2026; break 27.04.2026-03.05.2026; revision week 22.06.2026-28.06.2026; final examination 29.06.2026-19.07.2026; semester break 20.07.2026-16.08.2026. Special semester: lectures 27.07.2026-13.09.2026; final examination 14.09.2026-20.09.2026; break 21.09.2026-28.09.2026. Public holidays listed include Deepavali, Christmas, New Year, Thaipusam, Federal Territory Day, Chinese New Year, Nuzul Al-Quran, Eidul Fitri, Labour Day, Eidul Adha, Wesak Day, His Majesty the King's Birthday, Awal Muharram, Prophet Muhammad's Birthday, National Day, and Malaysia Day. The notes state that the module registration and examination schedule can be referred to in the UM system guide, the calendar is subject to change, and UM PG iFest 2026 is scheduled for 09-11 June 2026.",
133
- "scope_label": "postgraduate",
134
- "source_doc": "General Handbook",
135
- "section": "Academic Calendar 2025/2026",
136
- "subsection": "Master and Doctorate Level Academic Calendar",
137
- "retrieved_kb_ids": [
138
- "RAGKB-0006",
139
- "RAGKB-0007",
140
- "RAGKB-0009"
141
- ],
142
- "retrieved_sections": [
143
- "Academic Calendar 2025/2026",
144
- "Academic Calendar 2025/2026",
145
- "Academic Calendar 2025/2026"
146
- ],
147
- "retrieved_scopes": [
148
- "postgraduate",
149
- "postgraduate",
150
- "undergraduate"
151
- ],
152
- "prompt": [
153
- {
154
- "role": "system",
155
- "content": "You are an academic assistant for the Faculty of Computer Science and Information Technology, Universiti Malaya. Answer only with handbook-grounded information. Use the retrieved handbook evidence when it is provided. Keep the answer direct, specific, and faithful to the handbook. If the evidence does not support a claim, say so clearly and briefly."
156
- },
157
- {
158
- "role": "user",
159
- "content": "Use the retrieved handbook evidence to answer the question. Base the answer on the evidence and keep it faithful to the handbook.\n\n[Retrieved Evidence 1]\nSource document: General Handbook\nScope: postgraduate\nSection: Academic Calendar 2025/2026\nSubsection: Master and Doctorate Level Academic Calendar\nPages: 4\nKnowledge group: KG-0064\nChunk id: SC-00006\nText:\nLampiran B2 ACADEMIC CALENDAR 2025/2026 ACADEMIC SESSION (MASTER AND DOCTORATE LEVEL) AMENDMENT ‘SEMESTER | ‘Orientation (Week of Welcome)-WOW 1 week 05.10.2025 = «= 12.10.2025 Lectures, 6 weeks\" 19.10.2028 - 23.11.2025 Mid Semester | Break 1 week 24.11.2025 = © 30.11.2025 Lectures. 8 weeks\" 01.12.2025 = © 25.01.2026 Revision Week 1 weeks\" 26.01.2028 © - 01.02.2026 ‘Semester | Final Examination 3 weeks\" 02.02.2026 - © 2202.2026 ‘Semester | Break 2 week 23.02.2028 - 08.03.2026 22 weeks ‘SEMESTER I Lectures: 7 weeks\" 09.03.2026 - 26.04.2026 ‘Mid Semester II Break 1 week 27.04.2028 © - 03.05.2026 Lectures, 7 weeks* 04052026 - 21.06.2026 Revision Week 1 week* 22.06.2026 - 28.06.2026 ‘Semester II ...[truncated]\n\n[Retrieved Evidence 2]\nSource document: General Handbook\nScope: postgraduate\nSection: Academic Calendar 2025/2026\nSubsection: Master and Doctorate Level Academic Calendar\nPages: 4\nKnowledge group: KG-0064\nChunk id: SC-00007\nText:\n(1) The Module Registration and Examination Schedule can be referred to at tips /umsitsquide um edu my. All, information is subject to change. (0) The Academic Calendar has taken into account public and festive holidays and is subject to change Deepavali 20 October 2025 (Monday) CChvistnas Day 2 December 2025 (Thursday) New Year 04 Janvary 2026 (Thursday) ‘Thaipusam 01 February 2026 (Sunday) Federal Tertitory Day 01 February 2026 (Sunday) ‘Chinese New Year 17 & 18 Fetruary 2026 (Tuesday & Wednesday) Nuzul Al-Quran, 07 March 2026 (Saturday) Edu Fn 20.21 March 2026 (Friday & Saturday) Labour Day 1 May 2026 (Friday) idl Adhal 27 May 2026 (Wednesday) Wesak Day 34 May 2026 (Sunday) His Majesty th ...[truncated]\n\n[Retrieved Evidence 3]\nSource document: General Handbook\nScope: undergraduate\nSection: Academic Calendar 2025/2026\nSubsection: Bachelor Degree Level Academic Calendar\nPages: 12\nKnowledge group: KG-0087\nChunk id: SC-00009\nText:\n(1) The Module Registration and Examination Schedule can be referred to at https://umsitsquide um edumy, All information is subject to change. (() The Academic Calendar has taken into account public and festive holidays and is subject to change’ Deepavali 20 October 2028 (Monday) ‘Christmas Day 25 December 2025 (Thursday) New Year 01 January 2026 (Thursday) ‘Thaipusam 01 February 2026 (Sunday) Federal Tertory Day (01 February 2026 (Sunday) Chinese New Year 17 & 18 February 2026 (Tuesday & Wednesday) ‘Nuzul Al-Quran 07 March 2026 (Saturday) Eidul Ft 20 & 21 March 2026 (Friday & Saturday) Labour Day, 01 May 2026 (Friday) Eidul Adna (27 May 2026 (Wednesday) Wesak Day 31 May 2026 (Sunday) His Ma ...[truncated]\n\nQuestion: What is the academic calendar for master and doctorate level in session 2025/2026?"
160
- }
161
- ],
162
- "completion": [
163
- {
164
- "role": "assistant",
165
- "content": "The 2025/2026 master and doctorate academic calendar with Semester I, Semester II, and a special semester, covering orientation, lecture periods, mid-semester breaks, revision weeks, final examinations, and semester breaks. Semester I: Orientation (WOW) 05.10.2025-12.10.2025; lectures 13.10.2025-23.11.2025 and 01.12.2025-25.01.2026; mid-semester break 24.11.2025-30.11.2025; revision week 26.01.2026-01.02.2026; final examination 02.02.2026-22.02.2026; semester break 23.02.2026-08.03.2026. Semester II: lectures 09.03.2026-26.04.2026 and 04.05.2026-21.06.2026; break 27.04.2026-03.05.2026; revision week 22.06.2026-28.06.2026; final examination 29.06.2026-19.07.2026; semester break 20.07.2026-16.08.2026. Special semester: lectures 27.07.2026-13.09.2026; final examination 14.09.2026-20.09.2026; break 21.09.2026-28.09.2026. Public holidays listed include Deepavali, Christmas, New Year, Thaipusam, Federal Territory Day, Chinese New Year, Nuzul Al-Quran, Eidul Fitri, Labour Day, Eidul Adha, Wesak Day, His Majesty the King's Birthday, Awal Muharram, Prophet Muhammad's Birthday, National Day, and Malaysia Day. The notes state that the module registration and examination schedule can be referred to in the UM system guide, the calendar is subject to change, and UM PG iFest 2026 is scheduled for 09-11 June 2026."
166
- }
167
- ],
168
- "text": "<|im_start|>system\nYou are an academic assistant for the Faculty of Computer Science and Information Technology, Universiti Malaya. Answer only with handbook-grounded information. Use the retrieved handbook evidence when it is provided. Keep the answer direct, specific, and faithful to the handbook. If the evidence does not support a claim, say so clearly and briefly.<|im_end|>\n<|im_start|>user\nUse the retrieved handbook evidence to answer the question. Base the answer on the evidence and keep it faithful to the handbook.\n\n[Retrieved Evidence 1]\nSource document: General Handbook\nScope: postgraduate\nSection: Academic Calendar 2025/2026\nSubsection: Master and Doctorate Level Academic Calendar\nPages: 4\nKnowledge group: KG-0064\nChunk id: SC-00006\nText:\nLampiran B2 ACADEMIC CALENDAR 2025/2026 ACADEMIC SESSION (MASTER AND DOCTORATE LEVEL) AMENDMENT ‘SEMESTER | ‘Orientation (Week of Welcome)-WOW 1 week 05.10.2025 = «= 12.10.2025 Lectures, 6 weeks\" 19.10.2028 - 23.11.2025 Mid Semester | Break 1 week 24.11.2025 = © 30.11.2025 Lectures. 8 weeks\" 01.12.2025 = © 25.01.2026 Revision Week 1 weeks\" 26.01.2028 © - 01.02.2026 ‘Semester | Final Examination 3 weeks\" 02.02.2026 - © 2202.2026 ‘Semester | Break 2 week 23.02.2028 - 08.03.2026 22 weeks ‘SEMESTER I Lectures: 7 weeks\" 09.03.2026 - 26.04.2026 ‘Mid Semester II Break 1 week 27.04.2028 © - 03.05.2026 Lectures, 7 weeks* 04052026 - 21.06.2026 Revision Week 1 week* 22.06.2026 - 28.06.2026 ‘Semester II ...[truncated]\n\n[Retrieved Evidence 2]\nSource document: General Handbook\nScope: postgraduate\nSection: Academic Calendar 2025/2026\nSubsection: Master and Doctorate Level Academic Calendar\nPages: 4\nKnowledge group: KG-0064\nChunk id: SC-00007\nText:\n(1) The Module Registration and Examination Schedule can be referred to at tips /umsitsquide um edu my. All, information is subject to change. (0) The Academic Calendar has taken into account public and festive holidays and is subject to change Deepavali 20 October 2025 (Monday) CChvistnas Day 2 December 2025 (Thursday) New Year 04 Janvary 2026 (Thursday) ‘Thaipusam 01 February 2026 (Sunday) Federal Tertitory Day 01 February 2026 (Sunday) ‘Chinese New Year 17 & 18 Fetruary 2026 (Tuesday & Wednesday) Nuzul Al-Quran, 07 March 2026 (Saturday) Edu Fn 20.21 March 2026 (Friday & Saturday) Labour Day 1 May 2026 (Friday) idl Adhal 27 May 2026 (Wednesday) Wesak Day 34 May 2026 (Sunday) His Majesty th ...[truncated]\n\n[Retrieved Evidence 3]\nSource document: General Handbook\nScope: undergraduate\nSection: Academic Calendar 2025/2026\nSubsection: Bachelor Degree Level Academic Calendar\nPages: 12\nKnowledge group: KG-0087\nChunk id: SC-00009\nText:\n(1) The Module Registration and Examination Schedule can be referred to at https://umsitsquide um edumy, All information is subject to change. (() The Academic Calendar has taken into account public and festive holidays and is subject to change’ Deepavali 20 October 2028 (Monday) ‘Christmas Day 25 December 2025 (Thursday) New Year 01 January 2026 (Thursday) ‘Thaipusam 01 February 2026 (Sunday) Federal Tertory Day (01 February 2026 (Sunday) Chinese New Year 17 & 18 February 2026 (Tuesday & Wednesday) ‘Nuzul Al-Quran 07 March 2026 (Saturday) Eidul Ft 20 & 21 March 2026 (Friday & Saturday) Labour Day, 01 May 2026 (Friday) Eidul Adna (27 May 2026 (Wednesday) Wesak Day 31 May 2026 (Sunday) His Ma ...[truncated]\n\nQuestion: What is the academic calendar for master and doctorate level in session 2025/2026?<|im_end|>\n<|im_start|>assistant\n<think>\n\n</think>\n\nThe 2025/2026 master and doctorate academic calendar with Semester I, Semester II, and a special semester, covering orientation, lecture periods, mid-semester breaks, revision weeks, final examinations, and semester breaks. Semester I: Orientation (WOW) 05.10.2025-12.10.2025; lectures 13.10.2025-23.11.2025 and 01.12.2025-25.01.2026; mid-semester break 24.11.2025-30.11.2025; revision week 26.01.2026-01.02.2026; final examination 02.02.2026-22.02.2026; semester break 23.02.2026-08.03.2026. Semester II: lectures 09.03.2026-26.04.2026 and 04.05.2026-21.06.2026; break 27.04.2026-03.05.2026; revision week 22.06.2026-28.06.2026; final examination 29.06.2026-19.07.2026; semester break 20.07.2026-16.08.2026. Special semester: lectures 27.07.2026-13.09.2026; final examination 14.09.2026-20.09.2026; break 21.09.2026-28.09.2026. Public holidays listed include Deepavali, Christmas, New Year, Thaipusam, Federal Territory Day, Chinese New Year, Nuzul Al-Quran, Eidul Fitri, Labour Day, Eidul Adha, Wesak Day, His Majesty the King's Birthday, Awal Muharram, Prophet Muhammad's Birthday, National Day, and Malaysia Day. The notes state that the module registration and examination schedule can be referred to in the UM system guide, the calendar is subject to change, and UM PG iFest 2026 is scheduled for 09-11 June 2026.<|im_end|>\n"
169
- },
170
- {
171
- "qa_id": "qa_000005",
172
- "index_id": "UMI-0005",
173
- "question": "What is the academic calendar for bachelor degree level in session 2025/2026?",
174
- "answer": "The 2025/2026 bachelor degree academic calendar with Semester I, Semester II, and a special semester, covering orientation, lecture periods, mid-semester breaks, revision weeks, final examinations, and semester breaks. Semester I: Orientation (WOW) 05.10.2025-12.10.2025; lectures 13.10.2025-23.11.2025 and 01.12.2025-25.01.2026; mid-semester break 24.11.2025-30.11.2025; revision week 26.01.2026-01.02.2026; final examination 02.02.2026-22.02.2026; semester break 23.02.2026-08.03.2026. Semester II: lectures 09.03.2026-26.04.2026 and 04.05.2026-21.06.2026; break 27.04.2026-03.05.2026; revision week 22.06.2026-28.06.2026; final examination 29.06.2026-19.07.2026; semester break 20.07.2026-16.08.2026. Special semester: lectures 27.07.2026-13.09.2026; final examination 14.09.2026-20.09.2026; break 21.09.2026-28.09.2026. Public holidays listed include Deepavali, Christmas, New Year, Thaipusam, Federal Territory Day, Chinese New Year, Nuzul Al-Quran, Eidul Fitri, Labour Day, Eidul Adha, Wesak Day, His Majesty the King's Birthday, Awal Muharram, Prophet Muhammad's Birthday, National Day, and Malaysia Day. The notes state that the module registration and examination schedule can be referred to in the UM system guide, the calendar is subject to change, and UM UG iFest 2026 is scheduled for 09-11 June 2026.",
175
- "scope_label": "undergraduate",
176
- "source_doc": "General Handbook",
177
- "section": "Academic Calendar 2025/2026",
178
- "subsection": "Bachelor Degree Level Academic Calendar",
179
- "retrieved_kb_ids": [
180
- "RAGKB-0009",
181
- "RAGKB-0008",
182
- "RAGKB-0007"
183
- ],
184
- "retrieved_sections": [
185
- "Academic Calendar 2025/2026",
186
- "Academic Calendar 2025/2026",
187
- "Academic Calendar 2025/2026"
188
- ],
189
- "retrieved_scopes": [
190
- "undergraduate",
191
- "undergraduate",
192
- "postgraduate"
193
- ],
194
- "prompt": [
195
- {
196
- "role": "system",
197
- "content": "You are an academic assistant for the Faculty of Computer Science and Information Technology, Universiti Malaya. Answer only with handbook-grounded information. Use the retrieved handbook evidence when it is provided. Keep the answer direct, specific, and faithful to the handbook. If the evidence does not support a claim, say so clearly and briefly."
198
- },
199
- {
200
- "role": "user",
201
- "content": "Use the retrieved handbook evidence to answer the question. Base the answer on the evidence and keep it faithful to the handbook.\n\n[Retrieved Evidence 1]\nSource document: General Handbook\nScope: undergraduate\nSection: Academic Calendar 2025/2026\nSubsection: Bachelor Degree Level Academic Calendar\nPages: 12\nKnowledge group: KG-0087\nChunk id: SC-00009\nText:\n(1) The Module Registration and Examination Schedule can be referred to at https://umsitsquide um edumy, All information is subject to change. (() The Academic Calendar has taken into account public and festive holidays and is subject to change’ Deepavali 20 October 2028 (Monday) ‘Christmas Day 25 December 2025 (Thursday) New Year 01 January 2026 (Thursday) ‘Thaipusam 01 February 2026 (Sunday) Federal Tertory Day (01 February 2026 (Sunday) Chinese New Year 17 & 18 February 2026 (Tuesday & Wednesday) ‘Nuzul Al-Quran 07 March 2026 (Saturday) Eidul Ft 20 & 21 March 2026 (Friday & Saturday) Labour Day, 01 May 2026 (Friday) Eidul Adna (27 May 2026 (Wednesday) Wesak Day 31 May 2026 (Sunday) His Ma ...[truncated]\n\n[Retrieved Evidence 2]\nSource document: General Handbook\nScope: undergraduate\nSection: Academic Calendar 2025/2026\nSubsection: Bachelor Degree Level Academic Calendar\nPages: 12\nKnowledge group: KG-0087\nChunk id: SC-00008\nText:\nEy ACADEMIC CALENDAR et SESSION 2025/2026 A eee ACADEMIC CALENDAR 2025/2026 ACADEMIC SESSION (BACHELOR DEGREE LEVEL) AMENDMENT SEMESTER | Orientation (Week of Welcome)-WOW 1 week 05.10.2025 - 12.10.2025 Lectures 6 weeks* 13.10.2025 - = 23.11.2025 Mid Semester | Break 1 week 24.11.2025 - 30.11.2025 Lectures, 8 weeks* 01.12.2025 - — 26.01.2026 Revision Week 1 weeks* 26.01.2026 - 01.02.2026 ‘Semester | Final Examination 3 weeks* 02.02.2026 - 22.02.2026 ‘Semester | Break 2 week 23.02.2026 - 08.03.2026 22 weeks ‘SEMESTER I Lectures 7 weeks* 09.03.2026 - 26.04.2026 Mid Semester II Break 1 week 27.04.2026 - 03.05.2026 Lectures. 7 weeks* 04.05.2026 - 21.06.2026 Revision Week 1 week\" 22.06.2026 - 28. ...[truncated]\n\n[Retrieved Evidence 3]\nSource document: General Handbook\nScope: postgraduate\nSection: Academic Calendar 2025/2026\nSubsection: Master and Doctorate Level Academic Calendar\nPages: 4\nKnowledge group: KG-0064\nChunk id: SC-00007\nText:\n(1) The Module Registration and Examination Schedule can be referred to at tips /umsitsquide um edu my. All, information is subject to change. (0) The Academic Calendar has taken into account public and festive holidays and is subject to change Deepavali 20 October 2025 (Monday) CChvistnas Day 2 December 2025 (Thursday) New Year 04 Janvary 2026 (Thursday) ‘Thaipusam 01 February 2026 (Sunday) Federal Tertitory Day 01 February 2026 (Sunday) ‘Chinese New Year 17 & 18 Fetruary 2026 (Tuesday & Wednesday) Nuzul Al-Quran, 07 March 2026 (Saturday) Edu Fn 20.21 March 2026 (Friday & Saturday) Labour Day 1 May 2026 (Friday) idl Adhal 27 May 2026 (Wednesday) Wesak Day 34 May 2026 (Sunday) His Majesty th ...[truncated]\n\nQuestion: What is the academic calendar for bachelor degree level in session 2025/2026?"
202
- }
203
- ],
204
- "completion": [
205
- {
206
- "role": "assistant",
207
- "content": "The 2025/2026 bachelor degree academic calendar with Semester I, Semester II, and a special semester, covering orientation, lecture periods, mid-semester breaks, revision weeks, final examinations, and semester breaks. Semester I: Orientation (WOW) 05.10.2025-12.10.2025; lectures 13.10.2025-23.11.2025 and 01.12.2025-25.01.2026; mid-semester break 24.11.2025-30.11.2025; revision week 26.01.2026-01.02.2026; final examination 02.02.2026-22.02.2026; semester break 23.02.2026-08.03.2026. Semester II: lectures 09.03.2026-26.04.2026 and 04.05.2026-21.06.2026; break 27.04.2026-03.05.2026; revision week 22.06.2026-28.06.2026; final examination 29.06.2026-19.07.2026; semester break 20.07.2026-16.08.2026. Special semester: lectures 27.07.2026-13.09.2026; final examination 14.09.2026-20.09.2026; break 21.09.2026-28.09.2026. Public holidays listed include Deepavali, Christmas, New Year, Thaipusam, Federal Territory Day, Chinese New Year, Nuzul Al-Quran, Eidul Fitri, Labour Day, Eidul Adha, Wesak Day, His Majesty the King's Birthday, Awal Muharram, Prophet Muhammad's Birthday, National Day, and Malaysia Day. The notes state that the module registration and examination schedule can be referred to in the UM system guide, the calendar is subject to change, and UM UG iFest 2026 is scheduled for 09-11 June 2026."
208
- }
209
- ],
210
- "text": "<|im_start|>system\nYou are an academic assistant for the Faculty of Computer Science and Information Technology, Universiti Malaya. Answer only with handbook-grounded information. Use the retrieved handbook evidence when it is provided. Keep the answer direct, specific, and faithful to the handbook. If the evidence does not support a claim, say so clearly and briefly.<|im_end|>\n<|im_start|>user\nUse the retrieved handbook evidence to answer the question. Base the answer on the evidence and keep it faithful to the handbook.\n\n[Retrieved Evidence 1]\nSource document: General Handbook\nScope: undergraduate\nSection: Academic Calendar 2025/2026\nSubsection: Bachelor Degree Level Academic Calendar\nPages: 12\nKnowledge group: KG-0087\nChunk id: SC-00009\nText:\n(1) The Module Registration and Examination Schedule can be referred to at https://umsitsquide um edumy, All information is subject to change. (() The Academic Calendar has taken into account public and festive holidays and is subject to change’ Deepavali 20 October 2028 (Monday) ‘Christmas Day 25 December 2025 (Thursday) New Year 01 January 2026 (Thursday) ‘Thaipusam 01 February 2026 (Sunday) Federal Tertory Day (01 February 2026 (Sunday) Chinese New Year 17 & 18 February 2026 (Tuesday & Wednesday) ‘Nuzul Al-Quran 07 March 2026 (Saturday) Eidul Ft 20 & 21 March 2026 (Friday & Saturday) Labour Day, 01 May 2026 (Friday) Eidul Adna (27 May 2026 (Wednesday) Wesak Day 31 May 2026 (Sunday) His Ma ...[truncated]\n\n[Retrieved Evidence 2]\nSource document: General Handbook\nScope: undergraduate\nSection: Academic Calendar 2025/2026\nSubsection: Bachelor Degree Level Academic Calendar\nPages: 12\nKnowledge group: KG-0087\nChunk id: SC-00008\nText:\nEy ACADEMIC CALENDAR et SESSION 2025/2026 A eee ACADEMIC CALENDAR 2025/2026 ACADEMIC SESSION (BACHELOR DEGREE LEVEL) AMENDMENT SEMESTER | Orientation (Week of Welcome)-WOW 1 week 05.10.2025 - 12.10.2025 Lectures 6 weeks* 13.10.2025 - = 23.11.2025 Mid Semester | Break 1 week 24.11.2025 - 30.11.2025 Lectures, 8 weeks* 01.12.2025 - — 26.01.2026 Revision Week 1 weeks* 26.01.2026 - 01.02.2026 ‘Semester | Final Examination 3 weeks* 02.02.2026 - 22.02.2026 ‘Semester | Break 2 week 23.02.2026 - 08.03.2026 22 weeks ‘SEMESTER I Lectures 7 weeks* 09.03.2026 - 26.04.2026 Mid Semester II Break 1 week 27.04.2026 - 03.05.2026 Lectures. 7 weeks* 04.05.2026 - 21.06.2026 Revision Week 1 week\" 22.06.2026 - 28. ...[truncated]\n\n[Retrieved Evidence 3]\nSource document: General Handbook\nScope: postgraduate\nSection: Academic Calendar 2025/2026\nSubsection: Master and Doctorate Level Academic Calendar\nPages: 4\nKnowledge group: KG-0064\nChunk id: SC-00007\nText:\n(1) The Module Registration and Examination Schedule can be referred to at tips /umsitsquide um edu my. All, information is subject to change. (0) The Academic Calendar has taken into account public and festive holidays and is subject to change Deepavali 20 October 2025 (Monday) CChvistnas Day 2 December 2025 (Thursday) New Year 04 Janvary 2026 (Thursday) ‘Thaipusam 01 February 2026 (Sunday) Federal Tertitory Day 01 February 2026 (Sunday) ‘Chinese New Year 17 & 18 Fetruary 2026 (Tuesday & Wednesday) Nuzul Al-Quran, 07 March 2026 (Saturday) Edu Fn 20.21 March 2026 (Friday & Saturday) Labour Day 1 May 2026 (Friday) idl Adhal 27 May 2026 (Wednesday) Wesak Day 34 May 2026 (Sunday) His Majesty th ...[truncated]\n\nQuestion: What is the academic calendar for bachelor degree level in session 2025/2026?<|im_end|>\n<|im_start|>assistant\n<think>\n\n</think>\n\nThe 2025/2026 bachelor degree academic calendar with Semester I, Semester II, and a special semester, covering orientation, lecture periods, mid-semester breaks, revision weeks, final examinations, and semester breaks. Semester I: Orientation (WOW) 05.10.2025-12.10.2025; lectures 13.10.2025-23.11.2025 and 01.12.2025-25.01.2026; mid-semester break 24.11.2025-30.11.2025; revision week 26.01.2026-01.02.2026; final examination 02.02.2026-22.02.2026; semester break 23.02.2026-08.03.2026. Semester II: lectures 09.03.2026-26.04.2026 and 04.05.2026-21.06.2026; break 27.04.2026-03.05.2026; revision week 22.06.2026-28.06.2026; final examination 29.06.2026-19.07.2026; semester break 20.07.2026-16.08.2026. Special semester: lectures 27.07.2026-13.09.2026; final examination 14.09.2026-20.09.2026; break 21.09.2026-28.09.2026. Public holidays listed include Deepavali, Christmas, New Year, Thaipusam, Federal Territory Day, Chinese New Year, Nuzul Al-Quran, Eidul Fitri, Labour Day, Eidul Adha, Wesak Day, His Majesty the King's Birthday, Awal Muharram, Prophet Muhammad's Birthday, National Day, and Malaysia Day. The notes state that the module registration and examination schedule can be referred to in the UM system guide, the calendar is subject to change, and UM UG iFest 2026 is scheduled for 09-11 June 2026.<|im_end|>\n"
211
- }
212
- ]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/rag_augmented_dataset/rag_text_length_summary.json DELETED
@@ -1,11 +0,0 @@
1
- {
2
- "count": 1000,
3
- "min_tokens": 446,
4
- "p50_tokens": 800,
5
- "p90_tokens": 1036,
6
- "p95_tokens": 1234,
7
- "p99_tokens": 1488,
8
- "max_tokens": 1987,
9
- "configured_max_seq_length": 1024,
10
- "examples_over_max_seq_length": 114
11
- }
 
 
 
 
 
 
 
 
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/retrieval_eval/retrieval_details.jsonl DELETED
The diff for this file is too large to render. See raw diff
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/retrieval_eval/retrieval_metrics.json DELETED
@@ -1,10 +0,0 @@
1
- {
2
- "retrieval_eval_size": 1000,
3
- "top_k": 3,
4
- "hit_at_1_primary": 0.821,
5
- "hit_at_k_primary": 0.954,
6
- "hit_at_k_same_group": 0.991,
7
- "scope_match_at_1": 0.996,
8
- "retriever_type": "dense_embedding + faiss + metadata_rerank",
9
- "embedding_model_name": "BAAI/bge-base-en-v1.5"
10
- }
 
 
 
 
 
 
 
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/README.md DELETED
@@ -1,57 +0,0 @@
1
- ---
2
- library_name: transformers
3
- model_name: trainer_runs
4
- tags:
5
- - generated_from_trainer
6
- - sft
7
- - trl
8
- licence: license
9
- ---
10
-
11
- # Model Card for trainer_runs
12
-
13
- This model is a fine-tuned version of [None](https://huggingface.co/None).
14
- It has been trained using [TRL](https://github.com/huggingface/trl).
15
-
16
- ## Quick start
17
-
18
- ```python
19
- from transformers import pipeline
20
-
21
- question = "If you had a time machine, but could only go to the past or the future once and never return, which would you choose and why?"
22
- generator = pipeline("text-generation", model="None", device="cuda")
23
- output = generator([{"role": "user", "content": question}], max_new_tokens=128, return_full_text=False)[0]
24
- print(output["generated_text"])
25
- ```
26
-
27
- ## Training procedure
28
-
29
-
30
-
31
-
32
-
33
- This model was trained with SFT.
34
-
35
- ### Framework versions
36
-
37
- - TRL: 1.1.0
38
- - Transformers: 5.3.0
39
- - Pytorch: 2.5.1+cu121
40
- - Datasets: 2.19.2
41
- - Tokenizers: 0.22.2
42
-
43
- ## Citations
44
-
45
-
46
-
47
- Cite TRL as:
48
-
49
- ```bibtex
50
- @software{vonwerra2020trl,
51
- title = {{TRL: Transformers Reinforcement Learning}},
52
- author = {von Werra, Leandro and Belkada, Younes and Tunstall, Lewis and Beeching, Edward and Thrush, Tristan and Lambert, Nathan and Huang, Shengyi and Rasul, Kashif and Gallouédec, Quentin},
53
- license = {Apache-2.0},
54
- url = {https://github.com/huggingface/trl},
55
- year = {2020}
56
- }
57
- ```
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-1000/README.md DELETED
@@ -1,209 +0,0 @@
1
- ---
2
- base_model: /scr/user/kevin2002/TensorCat/NLP/UM_Handbook/models/Qwen3-8B
3
- library_name: peft
4
- pipeline_tag: text-generation
5
- tags:
6
- - base_model:adapter:/scr/user/kevin2002/TensorCat/NLP/UM_Handbook/models/Qwen3-8B
7
- - lora
8
- - sft
9
- - transformers
10
- - trl
11
- ---
12
-
13
- # Model Card for Model ID
14
-
15
- <!-- Provide a quick summary of what the model is/does. -->
16
-
17
-
18
-
19
- ## Model Details
20
-
21
- ### Model Description
22
-
23
- <!-- Provide a longer summary of what this model is. -->
24
-
25
-
26
-
27
- - **Developed by:** [More Information Needed]
28
- - **Funded by [optional]:** [More Information Needed]
29
- - **Shared by [optional]:** [More Information Needed]
30
- - **Model type:** [More Information Needed]
31
- - **Language(s) (NLP):** [More Information Needed]
32
- - **License:** [More Information Needed]
33
- - **Finetuned from model [optional]:** [More Information Needed]
34
-
35
- ### Model Sources [optional]
36
-
37
- <!-- Provide the basic links for the model. -->
38
-
39
- - **Repository:** [More Information Needed]
40
- - **Paper [optional]:** [More Information Needed]
41
- - **Demo [optional]:** [More Information Needed]
42
-
43
- ## Uses
44
-
45
- <!-- Address questions around how the model is intended to be used, including the foreseeable users of the model and those affected by the model. -->
46
-
47
- ### Direct Use
48
-
49
- <!-- This section is for the model use without fine-tuning or plugging into a larger ecosystem/app. -->
50
-
51
- [More Information Needed]
52
-
53
- ### Downstream Use [optional]
54
-
55
- <!-- This section is for the model use when fine-tuned for a task, or when plugged into a larger ecosystem/app -->
56
-
57
- [More Information Needed]
58
-
59
- ### Out-of-Scope Use
60
-
61
- <!-- This section addresses misuse, malicious use, and uses that the model will not work well for. -->
62
-
63
- [More Information Needed]
64
-
65
- ## Bias, Risks, and Limitations
66
-
67
- <!-- This section is meant to convey both technical and sociotechnical limitations. -->
68
-
69
- [More Information Needed]
70
-
71
- ### Recommendations
72
-
73
- <!-- This section is meant to convey recommendations with respect to the bias, risk, and technical limitations. -->
74
-
75
- Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
76
-
77
- ## How to Get Started with the Model
78
-
79
- Use the code below to get started with the model.
80
-
81
- [More Information Needed]
82
-
83
- ## Training Details
84
-
85
- ### Training Data
86
-
87
- <!-- This should link to a Dataset Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
88
-
89
- [More Information Needed]
90
-
91
- ### Training Procedure
92
-
93
- <!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
94
-
95
- #### Preprocessing [optional]
96
-
97
- [More Information Needed]
98
-
99
-
100
- #### Training Hyperparameters
101
-
102
- - **Training regime:** [More Information Needed] <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
103
-
104
- #### Speeds, Sizes, Times [optional]
105
-
106
- <!-- This section provides information about throughput, start/end time, checkpoint size if relevant, etc. -->
107
-
108
- [More Information Needed]
109
-
110
- ## Evaluation
111
-
112
- <!-- This section describes the evaluation protocols and provides the results. -->
113
-
114
- ### Testing Data, Factors & Metrics
115
-
116
- #### Testing Data
117
-
118
- <!-- This should link to a Dataset Card if possible. -->
119
-
120
- [More Information Needed]
121
-
122
- #### Factors
123
-
124
- <!-- These are the things the evaluation is disaggregating by, e.g., subpopulations or domains. -->
125
-
126
- [More Information Needed]
127
-
128
- #### Metrics
129
-
130
- <!-- These are the evaluation metrics being used, ideally with a description of why. -->
131
-
132
- [More Information Needed]
133
-
134
- ### Results
135
-
136
- [More Information Needed]
137
-
138
- #### Summary
139
-
140
-
141
-
142
- ## Model Examination [optional]
143
-
144
- <!-- Relevant interpretability work for the model goes here -->
145
-
146
- [More Information Needed]
147
-
148
- ## Environmental Impact
149
-
150
- <!-- Total emissions (in grams of CO2eq) and additional considerations, such as electricity usage, go here. Edit the suggested text below accordingly -->
151
-
152
- Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
153
-
154
- - **Hardware Type:** [More Information Needed]
155
- - **Hours used:** [More Information Needed]
156
- - **Cloud Provider:** [More Information Needed]
157
- - **Compute Region:** [More Information Needed]
158
- - **Carbon Emitted:** [More Information Needed]
159
-
160
- ## Technical Specifications [optional]
161
-
162
- ### Model Architecture and Objective
163
-
164
- [More Information Needed]
165
-
166
- ### Compute Infrastructure
167
-
168
- [More Information Needed]
169
-
170
- #### Hardware
171
-
172
- [More Information Needed]
173
-
174
- #### Software
175
-
176
- [More Information Needed]
177
-
178
- ## Citation [optional]
179
-
180
- <!-- If there is a paper or blog post introducing the model, the APA and Bibtex information for that should go in this section. -->
181
-
182
- **BibTeX:**
183
-
184
- [More Information Needed]
185
-
186
- **APA:**
187
-
188
- [More Information Needed]
189
-
190
- ## Glossary [optional]
191
-
192
- <!-- If relevant, include terms and calculations in this section that can help readers understand the model or model card. -->
193
-
194
- [More Information Needed]
195
-
196
- ## More Information [optional]
197
-
198
- [More Information Needed]
199
-
200
- ## Model Card Authors [optional]
201
-
202
- [More Information Needed]
203
-
204
- ## Model Card Contact
205
-
206
- [More Information Needed]
207
- ### Framework versions
208
-
209
- - PEFT 0.18.1
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-1000/adapter_config.json DELETED
@@ -1,46 +0,0 @@
1
- {
2
- "alora_invocation_tokens": null,
3
- "alpha_pattern": {},
4
- "arrow_config": null,
5
- "auto_mapping": null,
6
- "base_model_name_or_path": "/scr/user/kevin2002/TensorCat/NLP/UM_Handbook/models/Qwen3-8B",
7
- "bias": "none",
8
- "corda_config": null,
9
- "ensure_weight_tying": false,
10
- "eva_config": null,
11
- "exclude_modules": null,
12
- "fan_in_fan_out": false,
13
- "inference_mode": true,
14
- "init_lora_weights": true,
15
- "layer_replication": null,
16
- "layers_pattern": null,
17
- "layers_to_transform": null,
18
- "loftq_config": {},
19
- "lora_alpha": 16,
20
- "lora_bias": false,
21
- "lora_dropout": 0.05,
22
- "megatron_config": null,
23
- "megatron_core": "megatron.core",
24
- "modules_to_save": null,
25
- "peft_type": "LORA",
26
- "peft_version": "0.18.1",
27
- "qalora_group_size": 16,
28
- "r": 8,
29
- "rank_pattern": {},
30
- "revision": null,
31
- "target_modules": [
32
- "o_proj",
33
- "up_proj",
34
- "q_proj",
35
- "down_proj",
36
- "k_proj",
37
- "v_proj",
38
- "gate_proj"
39
- ],
40
- "target_parameters": null,
41
- "task_type": "CAUSAL_LM",
42
- "trainable_token_indices": null,
43
- "use_dora": false,
44
- "use_qalora": false,
45
- "use_rslora": false
46
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-1000/adapter_model.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:dbd4b80a7609306be0907324ca37c80b133810797630ea660f1c2d0ccc4b7f40
3
- size 87360584
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-1000/chat_template.jinja DELETED
@@ -1,89 +0,0 @@
1
- {%- if tools %}
2
- {{- '<|im_start|>system\n' }}
3
- {%- if messages[0].role == 'system' %}
4
- {{- messages[0].content + '\n\n' }}
5
- {%- endif %}
6
- {{- "# Tools\n\nYou may call one or more functions to assist with the user query.\n\nYou are provided with function signatures within <tools></tools> XML tags:\n<tools>" }}
7
- {%- for tool in tools %}
8
- {{- "\n" }}
9
- {{- tool | tojson }}
10
- {%- endfor %}
11
- {{- "\n</tools>\n\nFor each function call, return a json object with function name and arguments within <tool_call></tool_call> XML tags:\n<tool_call>\n{\"name\": <function-name>, \"arguments\": <args-json-object>}\n</tool_call><|im_end|>\n" }}
12
- {%- else %}
13
- {%- if messages[0].role == 'system' %}
14
- {{- '<|im_start|>system\n' + messages[0].content + '<|im_end|>\n' }}
15
- {%- endif %}
16
- {%- endif %}
17
- {%- set ns = namespace(multi_step_tool=true, last_query_index=messages|length - 1) %}
18
- {%- for message in messages[::-1] %}
19
- {%- set index = (messages|length - 1) - loop.index0 %}
20
- {%- if ns.multi_step_tool and message.role == "user" and message.content is string and not(message.content.startswith('<tool_response>') and message.content.endswith('</tool_response>')) %}
21
- {%- set ns.multi_step_tool = false %}
22
- {%- set ns.last_query_index = index %}
23
- {%- endif %}
24
- {%- endfor %}
25
- {%- for message in messages %}
26
- {%- if message.content is string %}
27
- {%- set content = message.content %}
28
- {%- else %}
29
- {%- set content = '' %}
30
- {%- endif %}
31
- {%- if (message.role == "user") or (message.role == "system" and not loop.first) %}
32
- {{- '<|im_start|>' + message.role + '\n' + content + '<|im_end|>' + '\n' }}
33
- {%- elif message.role == "assistant" %}
34
- {%- set reasoning_content = '' %}
35
- {%- if message.reasoning_content is string %}
36
- {%- set reasoning_content = message.reasoning_content %}
37
- {%- else %}
38
- {%- if '</think>' in content %}
39
- {%- set reasoning_content = content.split('</think>')[0].rstrip('\n').split('<think>')[-1].lstrip('\n') %}
40
- {%- set content = content.split('</think>')[-1].lstrip('\n') %}
41
- {%- endif %}
42
- {%- endif %}
43
- {%- if loop.index0 > ns.last_query_index %}
44
- {%- if loop.last or (not loop.last and reasoning_content) %}
45
- {{- '<|im_start|>' + message.role + '\n<think>\n' + reasoning_content.strip('\n') + '\n</think>\n\n' + content.lstrip('\n') }}
46
- {%- else %}
47
- {{- '<|im_start|>' + message.role + '\n' + content }}
48
- {%- endif %}
49
- {%- else %}
50
- {{- '<|im_start|>' + message.role + '\n' + content }}
51
- {%- endif %}
52
- {%- if message.tool_calls %}
53
- {%- for tool_call in message.tool_calls %}
54
- {%- if (loop.first and content) or (not loop.first) %}
55
- {{- '\n' }}
56
- {%- endif %}
57
- {%- if tool_call.function %}
58
- {%- set tool_call = tool_call.function %}
59
- {%- endif %}
60
- {{- '<tool_call>\n{"name": "' }}
61
- {{- tool_call.name }}
62
- {{- '", "arguments": ' }}
63
- {%- if tool_call.arguments is string %}
64
- {{- tool_call.arguments }}
65
- {%- else %}
66
- {{- tool_call.arguments | tojson }}
67
- {%- endif %}
68
- {{- '}\n</tool_call>' }}
69
- {%- endfor %}
70
- {%- endif %}
71
- {{- '<|im_end|>\n' }}
72
- {%- elif message.role == "tool" %}
73
- {%- if loop.first or (messages[loop.index0 - 1].role != "tool") %}
74
- {{- '<|im_start|>user' }}
75
- {%- endif %}
76
- {{- '\n<tool_response>\n' }}
77
- {{- content }}
78
- {{- '\n</tool_response>' }}
79
- {%- if loop.last or (messages[loop.index0 + 1].role != "tool") %}
80
- {{- '<|im_end|>\n' }}
81
- {%- endif %}
82
- {%- endif %}
83
- {%- endfor %}
84
- {%- if add_generation_prompt %}
85
- {{- '<|im_start|>assistant\n' }}
86
- {%- if enable_thinking is defined and enable_thinking is false %}
87
- {{- '<think>\n\n</think>\n\n' }}
88
- {%- endif %}
89
- {%- endif %}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-1000/optimizer.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:a5cc8a6b6e65945a5f44363ec3f269aa0e5ae464a29df361c972db2874a5621f
3
- size 175019258
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-1000/rng_state.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:5a5928b921db1668cbcf0af4b32ba434c9435a70eee287442a4fcc4751f93b5d
3
- size 14244
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-1000/scheduler.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:fdf053492e46775ae2bc25e8348e495261299a36ab8b412170267cc0223f930e
3
- size 1064
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-1000/tokenizer.json DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:be75606093db2094d7cd20f3c2f385c212750648bd6ea4fb2bf507a6a4c55506
3
- size 11422650
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-1000/tokenizer_config.json DELETED
@@ -1,29 +0,0 @@
1
- {
2
- "add_prefix_space": false,
3
- "backend": "tokenizers",
4
- "bos_token": null,
5
- "clean_up_tokenization_spaces": false,
6
- "eos_token": "<|im_end|>",
7
- "errors": "replace",
8
- "extra_special_tokens": [
9
- "<|im_start|>",
10
- "<|im_end|>",
11
- "<|object_ref_start|>",
12
- "<|object_ref_end|>",
13
- "<|box_start|>",
14
- "<|box_end|>",
15
- "<|quad_start|>",
16
- "<|quad_end|>",
17
- "<|vision_start|>",
18
- "<|vision_end|>",
19
- "<|vision_pad|>",
20
- "<|image_pad|>",
21
- "<|video_pad|>"
22
- ],
23
- "is_local": true,
24
- "model_max_length": 131072,
25
- "pad_token": "<|endoftext|>",
26
- "split_special_tokens": false,
27
- "tokenizer_class": "Qwen2Tokenizer",
28
- "unk_token": null
29
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-1000/trainer_state.json DELETED
@@ -1,553 +0,0 @@
1
- {
2
- "best_global_step": 900,
3
- "best_metric": 0.1760927140712738,
4
- "best_model_checkpoint": "/scr/user/kevin2002/TensorCat/NLP/UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-900",
5
- "epoch": 10.0,
6
- "eval_steps": 500,
7
- "global_step": 1000,
8
- "is_hyper_param_search": false,
9
- "is_local_process_zero": true,
10
- "is_world_process_zero": true,
11
- "log_history": [
12
- {
13
- "entropy": 1.4358372974395752,
14
- "epoch": 0.25,
15
- "grad_norm": 0.14446501433849335,
16
- "learning_rate": 7.999671154713278e-05,
17
- "loss": 2.3676884460449217,
18
- "mean_token_accuracy": 0.5813838094472885,
19
- "num_tokens": 160725.0,
20
- "step": 25
21
- },
22
- {
23
- "entropy": 1.879828963279724,
24
- "epoch": 0.5,
25
- "grad_norm": 0.15517809987068176,
26
- "learning_rate": 7.982727278231343e-05,
27
- "loss": 1.7838900756835938,
28
- "mean_token_accuracy": 0.6484150147438049,
29
- "num_tokens": 327066.0,
30
- "step": 50
31
- },
32
- {
33
- "entropy": 1.4648912394046782,
34
- "epoch": 0.75,
35
- "grad_norm": 0.1660589873790741,
36
- "learning_rate": 7.940216640438628e-05,
37
- "loss": 1.4690559387207032,
38
- "mean_token_accuracy": 0.7019884788990021,
39
- "num_tokens": 490539.0,
40
- "step": 75
41
- },
42
- {
43
- "entropy": 1.3251829946041107,
44
- "epoch": 1.0,
45
- "grad_norm": 0.2699568569660187,
46
- "learning_rate": 7.872412134569766e-05,
47
- "loss": 1.312823028564453,
48
- "mean_token_accuracy": 0.726642736196518,
49
- "num_tokens": 656891.0,
50
- "step": 100
51
- },
52
- {
53
- "epoch": 1.0,
54
- "eval_entropy": 1.1702604523071876,
55
- "eval_loss": 1.1601083278656006,
56
- "eval_mean_token_accuracy": 0.7461812725433936,
57
- "eval_num_tokens": 656891.0,
58
- "eval_runtime": 14.1848,
59
- "eval_samples_per_second": 7.05,
60
- "eval_steps_per_second": 0.916,
61
- "step": 100
62
- },
63
- {
64
- "entropy": 0.9866749036312104,
65
- "epoch": 1.25,
66
- "grad_norm": 0.41134113073349,
67
- "learning_rate": 7.779749025581717e-05,
68
- "loss": 0.994763412475586,
69
- "mean_token_accuracy": 0.777331509590149,
70
- "num_tokens": 820900.0,
71
- "step": 125
72
- },
73
- {
74
- "entropy": 0.901508281826973,
75
- "epoch": 1.5,
76
- "grad_norm": 0.48528075218200684,
77
- "learning_rate": 7.662822156009336e-05,
78
- "loss": 0.903388442993164,
79
- "mean_token_accuracy": 0.8035100996494293,
80
- "num_tokens": 983751.0,
81
- "step": 150
82
- },
83
- {
84
- "entropy": 0.7128595209121704,
85
- "epoch": 1.75,
86
- "grad_norm": 0.5612214207649231,
87
- "learning_rate": 7.522382127426952e-05,
88
- "loss": 0.6967535400390625,
89
- "mean_token_accuracy": 0.8427894067764282,
90
- "num_tokens": 1148624.0,
91
- "step": 175
92
- },
93
- {
94
- "entropy": 0.5692075723409653,
95
- "epoch": 2.0,
96
- "grad_norm": 0.5570225715637207,
97
- "learning_rate": 7.35933048202875e-05,
98
- "loss": 0.5440200424194336,
99
- "mean_token_accuracy": 0.8759966826438904,
100
- "num_tokens": 1313782.0,
101
- "step": 200
102
- },
103
- {
104
- "epoch": 2.0,
105
- "eval_entropy": 0.6419096955886254,
106
- "eval_loss": 0.600500226020813,
107
- "eval_mean_token_accuracy": 0.861496246778048,
108
- "eval_num_tokens": 1313782.0,
109
- "eval_runtime": 14.1469,
110
- "eval_samples_per_second": 7.069,
111
- "eval_steps_per_second": 0.919,
112
- "step": 200
113
- },
114
- {
115
- "entropy": 0.44877232432365416,
116
- "epoch": 2.25,
117
- "grad_norm": 0.5958295464515686,
118
- "learning_rate": 7.174713915259331e-05,
119
- "loss": 0.41493446350097657,
120
- "mean_token_accuracy": 0.9032380354404449,
121
- "num_tokens": 1480714.0,
122
- "step": 225
123
- },
124
- {
125
- "entropy": 0.4503101620078087,
126
- "epoch": 2.5,
127
- "grad_norm": 0.7803889513015747,
128
- "learning_rate": 6.969717556645995e-05,
129
- "loss": 0.42063777923583984,
130
- "mean_token_accuracy": 0.9064690721035004,
131
- "num_tokens": 1645148.0,
132
- "step": 250
133
- },
134
- {
135
- "entropy": 0.3513291063904762,
136
- "epoch": 2.75,
137
- "grad_norm": 0.5489973425865173,
138
- "learning_rate": 6.745657361965803e-05,
139
- "loss": 0.32174919128417967,
140
- "mean_token_accuracy": 0.9250416386127472,
141
- "num_tokens": 1805051.0,
142
- "step": 275
143
- },
144
- {
145
- "entropy": 0.3790210232138634,
146
- "epoch": 3.0,
147
- "grad_norm": 0.9119548797607422,
148
- "learning_rate": 6.503971665585243e-05,
149
- "loss": 0.3341722106933594,
150
- "mean_token_accuracy": 0.9239817559719086,
151
- "num_tokens": 1970673.0,
152
- "step": 300
153
- },
154
- {
155
- "epoch": 3.0,
156
- "eval_entropy": 0.4204630897595332,
157
- "eval_loss": 0.38708260655403137,
158
- "eval_mean_token_accuracy": 0.9079863979266241,
159
- "eval_num_tokens": 1970673.0,
160
- "eval_runtime": 14.1106,
161
- "eval_samples_per_second": 7.087,
162
- "eval_steps_per_second": 0.921,
163
- "step": 300
164
- },
165
- {
166
- "entropy": 0.2572793909907341,
167
- "epoch": 3.25,
168
- "grad_norm": 0.4237155020236969,
169
- "learning_rate": 6.2462119472015e-05,
170
- "loss": 0.20618080139160155,
171
- "mean_token_accuracy": 0.9494317126274109,
172
- "num_tokens": 2133206.0,
173
- "step": 325
174
- },
175
- {
176
- "entropy": 0.29035701289772986,
177
- "epoch": 3.5,
178
- "grad_norm": 0.6824076175689697,
179
- "learning_rate": 5.974032872257388e-05,
180
- "loss": 0.25118282318115237,
181
- "mean_token_accuracy": 0.9438021230697632,
182
- "num_tokens": 2297449.0,
183
- "step": 350
184
- },
185
- {
186
- "entropy": 0.23607211165130138,
187
- "epoch": 3.75,
188
- "grad_norm": 0.8003197908401489,
189
- "learning_rate": 5.68918166996464e-05,
190
- "loss": 0.19911937713623046,
191
- "mean_token_accuracy": 0.9537552082538605,
192
- "num_tokens": 2462390.0,
193
- "step": 375
194
- },
195
- {
196
- "entropy": 0.23902728497982026,
197
- "epoch": 4.0,
198
- "grad_norm": 0.8474582433700562,
199
- "learning_rate": 5.393486917122353e-05,
200
- "loss": 0.20467203140258788,
201
- "mean_token_accuracy": 0.9515939724445343,
202
- "num_tokens": 2627564.0,
203
- "step": 400
204
- },
205
- {
206
- "epoch": 4.0,
207
- "eval_entropy": 0.31223052740097046,
208
- "eval_loss": 0.2847066819667816,
209
- "eval_mean_token_accuracy": 0.9322063556084266,
210
- "eval_num_tokens": 2627564.0,
211
- "eval_runtime": 13.9402,
212
- "eval_samples_per_second": 7.174,
213
- "eval_steps_per_second": 0.933,
214
- "step": 400
215
- },
216
- {
217
- "entropy": 0.17765841275453567,
218
- "epoch": 4.25,
219
- "grad_norm": 0.5740338563919067,
220
- "learning_rate": 5.088846799731885e-05,
221
- "loss": 0.13823826789855956,
222
- "mean_token_accuracy": 0.9671606945991517,
223
- "num_tokens": 2789214.0,
224
- "step": 425
225
- },
226
- {
227
- "entropy": 0.18791945070028304,
228
- "epoch": 4.5,
229
- "grad_norm": 0.30488306283950806,
230
- "learning_rate": 4.7772169277617086e-05,
231
- "loss": 0.14581723213195802,
232
- "mean_token_accuracy": 0.9664597606658936,
233
- "num_tokens": 2955470.0,
234
- "step": 450
235
- },
236
- {
237
- "entropy": 0.18473084963858127,
238
- "epoch": 4.75,
239
- "grad_norm": 0.5409578084945679,
240
- "learning_rate": 4.4605977812842384e-05,
241
- "loss": 0.15243392944335937,
242
- "mean_token_accuracy": 0.9648605918884278,
243
- "num_tokens": 3119188.0,
244
- "step": 475
245
- },
246
- {
247
- "entropy": 0.16782964013516902,
248
- "epoch": 5.0,
249
- "grad_norm": 0.6274464726448059,
250
- "learning_rate": 4.141021868573054e-05,
251
- "loss": 0.13563241958618164,
252
- "mean_token_accuracy": 0.9677622270584106,
253
- "num_tokens": 3284455.0,
254
- "step": 500
255
- },
256
- {
257
- "epoch": 5.0,
258
- "eval_entropy": 0.24806818537987196,
259
- "eval_loss": 0.23999404907226562,
260
- "eval_mean_token_accuracy": 0.94236238186176,
261
- "eval_num_tokens": 3284455.0,
262
- "eval_runtime": 13.8607,
263
- "eval_samples_per_second": 7.215,
264
- "eval_steps_per_second": 0.938,
265
- "step": 500
266
- },
267
- {
268
- "entropy": 0.14203706838190555,
269
- "epoch": 5.25,
270
- "grad_norm": 0.36970171332359314,
271
- "learning_rate": 3.820540678597942e-05,
272
- "loss": 0.11182730674743652,
273
- "mean_token_accuracy": 0.9730106520652771,
274
- "num_tokens": 3449400.0,
275
- "step": 525
276
- },
277
- {
278
- "entropy": 0.14063048042356968,
279
- "epoch": 5.5,
280
- "grad_norm": 0.4689595401287079,
281
- "learning_rate": 3.5012115116750614e-05,
282
- "loss": 0.10328823089599609,
283
- "mean_token_accuracy": 0.9750873637199402,
284
- "num_tokens": 3613152.0,
285
- "step": 550
286
- },
287
- {
288
- "entropy": 0.1214561627060175,
289
- "epoch": 5.75,
290
- "grad_norm": 0.6624268293380737,
291
- "learning_rate": 3.185084272811698e-05,
292
- "loss": 0.10185833930969239,
293
- "mean_token_accuracy": 0.9768549478054047,
294
- "num_tokens": 3776158.0,
295
- "step": 575
296
- },
297
- {
298
- "entropy": 0.12324205733835697,
299
- "epoch": 6.0,
300
- "grad_norm": 0.41641563177108765,
301
- "learning_rate": 2.8741883125245267e-05,
302
- "loss": 0.09359997749328614,
303
- "mean_token_accuracy": 0.9770605981349945,
304
- "num_tokens": 3941346.0,
305
- "step": 600
306
- },
307
- {
308
- "epoch": 6.0,
309
- "eval_entropy": 0.19075566071730393,
310
- "eval_loss": 0.212307408452034,
311
- "eval_mean_token_accuracy": 0.9502005072740408,
312
- "eval_num_tokens": 3941346.0,
313
- "eval_runtime": 13.9707,
314
- "eval_samples_per_second": 7.158,
315
- "eval_steps_per_second": 0.931,
316
- "step": 600
317
- },
318
- {
319
- "entropy": 0.12877136506140233,
320
- "epoch": 6.25,
321
- "grad_norm": 0.2692393362522125,
322
- "learning_rate": 2.5705193996055977e-05,
323
- "loss": 0.1031882667541504,
324
- "mean_token_accuracy": 0.9761876916885376,
325
- "num_tokens": 4106933.0,
326
- "step": 625
327
- },
328
- {
329
- "entropy": 0.08486215136945248,
330
- "epoch": 6.5,
331
- "grad_norm": 0.3272198438644409,
332
- "learning_rate": 2.2760269094631983e-05,
333
- "loss": 0.056387810707092284,
334
- "mean_token_accuracy": 0.9854865920543671,
335
- "num_tokens": 4268402.0,
336
- "step": 650
337
- },
338
- {
339
- "entropy": 0.11242001455277205,
340
- "epoch": 6.75,
341
- "grad_norm": 0.6421979665756226,
342
- "learning_rate": 1.992601310280891e-05,
343
- "loss": 0.09050872802734375,
344
- "mean_token_accuracy": 0.9787377977371216,
345
- "num_tokens": 4434736.0,
346
- "step": 675
347
- },
348
- {
349
- "entropy": 0.0798944342881441,
350
- "epoch": 7.0,
351
- "grad_norm": 0.35506346821784973,
352
- "learning_rate": 1.7220620273261923e-05,
353
- "loss": 0.050995888710021975,
354
- "mean_token_accuracy": 0.9863569080829621,
355
- "num_tokens": 4598237.0,
356
- "step": 700
357
- },
358
- {
359
- "epoch": 7.0,
360
- "eval_entropy": 0.16236452701000068,
361
- "eval_loss": 0.19433234632015228,
362
- "eval_mean_token_accuracy": 0.9543979305487412,
363
- "eval_num_tokens": 4598237.0,
364
- "eval_runtime": 13.9752,
365
- "eval_samples_per_second": 7.156,
366
- "eval_steps_per_second": 0.93,
367
- "step": 700
368
- },
369
- {
370
- "entropy": 0.10178964871913194,
371
- "epoch": 7.25,
372
- "grad_norm": 0.26595374941825867,
373
- "learning_rate": 1.466145763312922e-05,
374
- "loss": 0.07614684581756592,
375
- "mean_token_accuracy": 0.9819281613826751,
376
- "num_tokens": 4762560.0,
377
- "step": 725
378
- },
379
- {
380
- "entropy": 0.09404424335807562,
381
- "epoch": 7.5,
382
- "grad_norm": 0.23222072422504425,
383
- "learning_rate": 1.2264953497935479e-05,
384
- "loss": 0.06552838802337646,
385
- "mean_token_accuracy": 0.9836024832725525,
386
- "num_tokens": 4927776.0,
387
- "step": 750
388
- },
389
- {
390
- "entropy": 0.05591522835195065,
391
- "epoch": 7.75,
392
- "grad_norm": 0.24831674993038177,
393
- "learning_rate": 1.0046492011490874e-05,
394
- "loss": 0.034845557212829587,
395
- "mean_token_accuracy": 0.9901663279533386,
396
- "num_tokens": 5093008.0,
397
- "step": 775
398
- },
399
- {
400
- "entropy": 0.079307572953403,
401
- "epoch": 8.0,
402
- "grad_norm": 0.18024076521396637,
403
- "learning_rate": 8.020314388756562e-06,
404
- "loss": 0.050776734352111816,
405
- "mean_token_accuracy": 0.9873624122142792,
406
- "num_tokens": 5255128.0,
407
- "step": 800
408
- },
409
- {
410
- "epoch": 8.0,
411
- "eval_entropy": 0.15024888830689284,
412
- "eval_loss": 0.1804545819759369,
413
- "eval_mean_token_accuracy": 0.9596647941149198,
414
- "eval_num_tokens": 5255128.0,
415
- "eval_runtime": 14.1896,
416
- "eval_samples_per_second": 7.047,
417
- "eval_steps_per_second": 0.916,
418
- "step": 800
419
- },
420
- {
421
- "entropy": 0.05522842925041914,
422
- "epoch": 8.25,
423
- "grad_norm": 0.2229844033718109,
424
- "learning_rate": 6.199427495639963e-06,
425
- "loss": 0.029806861877441405,
426
- "mean_token_accuracy": 0.9915253543853759,
427
- "num_tokens": 5418711.0,
428
- "step": 825
429
- },
430
- {
431
- "entropy": 0.08227874159812927,
432
- "epoch": 8.5,
433
- "grad_norm": 0.21011501550674438,
434
- "learning_rate": 4.595520352583061e-06,
435
- "loss": 0.049187426567077634,
436
- "mean_token_accuracy": 0.9874508118629456,
437
- "num_tokens": 5585074.0,
438
- "step": 850
439
- },
440
- {
441
- "entropy": 0.07059245463460684,
442
- "epoch": 8.75,
443
- "grad_norm": 0.2088802009820938,
444
- "learning_rate": 3.2188890979419772e-06,
445
- "loss": 0.04377749443054199,
446
- "mean_token_accuracy": 0.9887262201309204,
447
- "num_tokens": 5748942.0,
448
- "step": 875
449
- },
450
- {
451
- "entropy": 0.0844693697988987,
452
- "epoch": 9.0,
453
- "grad_norm": 0.47332102060317993,
454
- "learning_rate": 2.078370892848134e-06,
455
- "loss": 0.05981508731842041,
456
- "mean_token_accuracy": 0.9852988374233246,
457
- "num_tokens": 5912019.0,
458
- "step": 900
459
- },
460
- {
461
- "epoch": 9.0,
462
- "eval_entropy": 0.14602531578678352,
463
- "eval_loss": 0.1760927140712738,
464
- "eval_mean_token_accuracy": 0.9613595421497638,
465
- "eval_num_tokens": 5912019.0,
466
- "eval_runtime": 14.0785,
467
- "eval_samples_per_second": 7.103,
468
- "eval_steps_per_second": 0.923,
469
- "step": 900
470
- },
471
- {
472
- "entropy": 0.07264392349869013,
473
- "epoch": 9.25,
474
- "grad_norm": 0.1500307023525238,
475
- "learning_rate": 1.1812871918434143e-06,
476
- "loss": 0.04127415180206299,
477
- "mean_token_accuracy": 0.9900540256500244,
478
- "num_tokens": 6076215.0,
479
- "step": 925
480
- },
481
- {
482
- "entropy": 0.06510979659855366,
483
- "epoch": 9.5,
484
- "grad_norm": 0.18775677680969238,
485
- "learning_rate": 5.333967434579324e-07,
486
- "loss": 0.03701672554016113,
487
- "mean_token_accuracy": 0.9901195931434631,
488
- "num_tokens": 6239231.0,
489
- "step": 950
490
- },
491
- {
492
- "entropy": 0.07681083966046572,
493
- "epoch": 9.75,
494
- "grad_norm": 0.14990992844104767,
495
- "learning_rate": 1.3885862243927072e-07,
496
- "loss": 0.050642023086547854,
497
- "mean_token_accuracy": 0.9876152622699738,
498
- "num_tokens": 6404599.0,
499
- "step": 975
500
- },
501
- {
502
- "entropy": 0.0641748109832406,
503
- "epoch": 10.0,
504
- "grad_norm": 0.16811969876289368,
505
- "learning_rate": 2.0553094437492095e-10,
506
- "loss": 0.039728012084960934,
507
- "mean_token_accuracy": 0.9897483742237091,
508
- "num_tokens": 6568910.0,
509
- "step": 1000
510
- },
511
- {
512
- "epoch": 10.0,
513
- "eval_entropy": 0.1441301224896541,
514
- "eval_loss": 0.17693637311458588,
515
- "eval_mean_token_accuracy": 0.9611430030602676,
516
- "eval_num_tokens": 6568910.0,
517
- "eval_runtime": 14.0079,
518
- "eval_samples_per_second": 7.139,
519
- "eval_steps_per_second": 0.928,
520
- "step": 1000
521
- }
522
- ],
523
- "logging_steps": 25,
524
- "max_steps": 1000,
525
- "num_input_tokens_seen": 0,
526
- "num_train_epochs": 10,
527
- "save_steps": 500,
528
- "stateful_callbacks": {
529
- "EarlyStoppingCallback": {
530
- "args": {
531
- "early_stopping_patience": 2,
532
- "early_stopping_threshold": 0.0
533
- },
534
- "attributes": {
535
- "early_stopping_patience_counter": 1
536
- }
537
- },
538
- "TrainerControl": {
539
- "args": {
540
- "should_epoch_stop": false,
541
- "should_evaluate": false,
542
- "should_log": false,
543
- "should_save": true,
544
- "should_training_stop": true
545
- },
546
- "attributes": {}
547
- }
548
- },
549
- "total_flos": 3.4511362480123085e+17,
550
- "train_batch_size": 4,
551
- "trial_name": null,
552
- "trial_params": null
553
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-1000/training_args.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:1e28aed9c09299882a0a85d4a5e7b5f033f6f0f96c839015b54f530ff1cc1760
3
- size 5368
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-900/README.md DELETED
@@ -1,209 +0,0 @@
1
- ---
2
- base_model: /scr/user/kevin2002/TensorCat/NLP/UM_Handbook/models/Qwen3-8B
3
- library_name: peft
4
- pipeline_tag: text-generation
5
- tags:
6
- - base_model:adapter:/scr/user/kevin2002/TensorCat/NLP/UM_Handbook/models/Qwen3-8B
7
- - lora
8
- - sft
9
- - transformers
10
- - trl
11
- ---
12
-
13
- # Model Card for Model ID
14
-
15
- <!-- Provide a quick summary of what the model is/does. -->
16
-
17
-
18
-
19
- ## Model Details
20
-
21
- ### Model Description
22
-
23
- <!-- Provide a longer summary of what this model is. -->
24
-
25
-
26
-
27
- - **Developed by:** [More Information Needed]
28
- - **Funded by [optional]:** [More Information Needed]
29
- - **Shared by [optional]:** [More Information Needed]
30
- - **Model type:** [More Information Needed]
31
- - **Language(s) (NLP):** [More Information Needed]
32
- - **License:** [More Information Needed]
33
- - **Finetuned from model [optional]:** [More Information Needed]
34
-
35
- ### Model Sources [optional]
36
-
37
- <!-- Provide the basic links for the model. -->
38
-
39
- - **Repository:** [More Information Needed]
40
- - **Paper [optional]:** [More Information Needed]
41
- - **Demo [optional]:** [More Information Needed]
42
-
43
- ## Uses
44
-
45
- <!-- Address questions around how the model is intended to be used, including the foreseeable users of the model and those affected by the model. -->
46
-
47
- ### Direct Use
48
-
49
- <!-- This section is for the model use without fine-tuning or plugging into a larger ecosystem/app. -->
50
-
51
- [More Information Needed]
52
-
53
- ### Downstream Use [optional]
54
-
55
- <!-- This section is for the model use when fine-tuned for a task, or when plugged into a larger ecosystem/app -->
56
-
57
- [More Information Needed]
58
-
59
- ### Out-of-Scope Use
60
-
61
- <!-- This section addresses misuse, malicious use, and uses that the model will not work well for. -->
62
-
63
- [More Information Needed]
64
-
65
- ## Bias, Risks, and Limitations
66
-
67
- <!-- This section is meant to convey both technical and sociotechnical limitations. -->
68
-
69
- [More Information Needed]
70
-
71
- ### Recommendations
72
-
73
- <!-- This section is meant to convey recommendations with respect to the bias, risk, and technical limitations. -->
74
-
75
- Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
76
-
77
- ## How to Get Started with the Model
78
-
79
- Use the code below to get started with the model.
80
-
81
- [More Information Needed]
82
-
83
- ## Training Details
84
-
85
- ### Training Data
86
-
87
- <!-- This should link to a Dataset Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
88
-
89
- [More Information Needed]
90
-
91
- ### Training Procedure
92
-
93
- <!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
94
-
95
- #### Preprocessing [optional]
96
-
97
- [More Information Needed]
98
-
99
-
100
- #### Training Hyperparameters
101
-
102
- - **Training regime:** [More Information Needed] <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
103
-
104
- #### Speeds, Sizes, Times [optional]
105
-
106
- <!-- This section provides information about throughput, start/end time, checkpoint size if relevant, etc. -->
107
-
108
- [More Information Needed]
109
-
110
- ## Evaluation
111
-
112
- <!-- This section describes the evaluation protocols and provides the results. -->
113
-
114
- ### Testing Data, Factors & Metrics
115
-
116
- #### Testing Data
117
-
118
- <!-- This should link to a Dataset Card if possible. -->
119
-
120
- [More Information Needed]
121
-
122
- #### Factors
123
-
124
- <!-- These are the things the evaluation is disaggregating by, e.g., subpopulations or domains. -->
125
-
126
- [More Information Needed]
127
-
128
- #### Metrics
129
-
130
- <!-- These are the evaluation metrics being used, ideally with a description of why. -->
131
-
132
- [More Information Needed]
133
-
134
- ### Results
135
-
136
- [More Information Needed]
137
-
138
- #### Summary
139
-
140
-
141
-
142
- ## Model Examination [optional]
143
-
144
- <!-- Relevant interpretability work for the model goes here -->
145
-
146
- [More Information Needed]
147
-
148
- ## Environmental Impact
149
-
150
- <!-- Total emissions (in grams of CO2eq) and additional considerations, such as electricity usage, go here. Edit the suggested text below accordingly -->
151
-
152
- Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
153
-
154
- - **Hardware Type:** [More Information Needed]
155
- - **Hours used:** [More Information Needed]
156
- - **Cloud Provider:** [More Information Needed]
157
- - **Compute Region:** [More Information Needed]
158
- - **Carbon Emitted:** [More Information Needed]
159
-
160
- ## Technical Specifications [optional]
161
-
162
- ### Model Architecture and Objective
163
-
164
- [More Information Needed]
165
-
166
- ### Compute Infrastructure
167
-
168
- [More Information Needed]
169
-
170
- #### Hardware
171
-
172
- [More Information Needed]
173
-
174
- #### Software
175
-
176
- [More Information Needed]
177
-
178
- ## Citation [optional]
179
-
180
- <!-- If there is a paper or blog post introducing the model, the APA and Bibtex information for that should go in this section. -->
181
-
182
- **BibTeX:**
183
-
184
- [More Information Needed]
185
-
186
- **APA:**
187
-
188
- [More Information Needed]
189
-
190
- ## Glossary [optional]
191
-
192
- <!-- If relevant, include terms and calculations in this section that can help readers understand the model or model card. -->
193
-
194
- [More Information Needed]
195
-
196
- ## More Information [optional]
197
-
198
- [More Information Needed]
199
-
200
- ## Model Card Authors [optional]
201
-
202
- [More Information Needed]
203
-
204
- ## Model Card Contact
205
-
206
- [More Information Needed]
207
- ### Framework versions
208
-
209
- - PEFT 0.18.1
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-900/adapter_config.json DELETED
@@ -1,46 +0,0 @@
1
- {
2
- "alora_invocation_tokens": null,
3
- "alpha_pattern": {},
4
- "arrow_config": null,
5
- "auto_mapping": null,
6
- "base_model_name_or_path": "/scr/user/kevin2002/TensorCat/NLP/UM_Handbook/models/Qwen3-8B",
7
- "bias": "none",
8
- "corda_config": null,
9
- "ensure_weight_tying": false,
10
- "eva_config": null,
11
- "exclude_modules": null,
12
- "fan_in_fan_out": false,
13
- "inference_mode": true,
14
- "init_lora_weights": true,
15
- "layer_replication": null,
16
- "layers_pattern": null,
17
- "layers_to_transform": null,
18
- "loftq_config": {},
19
- "lora_alpha": 16,
20
- "lora_bias": false,
21
- "lora_dropout": 0.05,
22
- "megatron_config": null,
23
- "megatron_core": "megatron.core",
24
- "modules_to_save": null,
25
- "peft_type": "LORA",
26
- "peft_version": "0.18.1",
27
- "qalora_group_size": 16,
28
- "r": 8,
29
- "rank_pattern": {},
30
- "revision": null,
31
- "target_modules": [
32
- "o_proj",
33
- "up_proj",
34
- "q_proj",
35
- "down_proj",
36
- "k_proj",
37
- "v_proj",
38
- "gate_proj"
39
- ],
40
- "target_parameters": null,
41
- "task_type": "CAUSAL_LM",
42
- "trainable_token_indices": null,
43
- "use_dora": false,
44
- "use_qalora": false,
45
- "use_rslora": false
46
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-900/adapter_model.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:6833958e7d1e52733a02c8675c398188d65dd02aed1c0cd026a6235c32247d7d
3
- size 87360584
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-900/chat_template.jinja DELETED
@@ -1,89 +0,0 @@
1
- {%- if tools %}
2
- {{- '<|im_start|>system\n' }}
3
- {%- if messages[0].role == 'system' %}
4
- {{- messages[0].content + '\n\n' }}
5
- {%- endif %}
6
- {{- "# Tools\n\nYou may call one or more functions to assist with the user query.\n\nYou are provided with function signatures within <tools></tools> XML tags:\n<tools>" }}
7
- {%- for tool in tools %}
8
- {{- "\n" }}
9
- {{- tool | tojson }}
10
- {%- endfor %}
11
- {{- "\n</tools>\n\nFor each function call, return a json object with function name and arguments within <tool_call></tool_call> XML tags:\n<tool_call>\n{\"name\": <function-name>, \"arguments\": <args-json-object>}\n</tool_call><|im_end|>\n" }}
12
- {%- else %}
13
- {%- if messages[0].role == 'system' %}
14
- {{- '<|im_start|>system\n' + messages[0].content + '<|im_end|>\n' }}
15
- {%- endif %}
16
- {%- endif %}
17
- {%- set ns = namespace(multi_step_tool=true, last_query_index=messages|length - 1) %}
18
- {%- for message in messages[::-1] %}
19
- {%- set index = (messages|length - 1) - loop.index0 %}
20
- {%- if ns.multi_step_tool and message.role == "user" and message.content is string and not(message.content.startswith('<tool_response>') and message.content.endswith('</tool_response>')) %}
21
- {%- set ns.multi_step_tool = false %}
22
- {%- set ns.last_query_index = index %}
23
- {%- endif %}
24
- {%- endfor %}
25
- {%- for message in messages %}
26
- {%- if message.content is string %}
27
- {%- set content = message.content %}
28
- {%- else %}
29
- {%- set content = '' %}
30
- {%- endif %}
31
- {%- if (message.role == "user") or (message.role == "system" and not loop.first) %}
32
- {{- '<|im_start|>' + message.role + '\n' + content + '<|im_end|>' + '\n' }}
33
- {%- elif message.role == "assistant" %}
34
- {%- set reasoning_content = '' %}
35
- {%- if message.reasoning_content is string %}
36
- {%- set reasoning_content = message.reasoning_content %}
37
- {%- else %}
38
- {%- if '</think>' in content %}
39
- {%- set reasoning_content = content.split('</think>')[0].rstrip('\n').split('<think>')[-1].lstrip('\n') %}
40
- {%- set content = content.split('</think>')[-1].lstrip('\n') %}
41
- {%- endif %}
42
- {%- endif %}
43
- {%- if loop.index0 > ns.last_query_index %}
44
- {%- if loop.last or (not loop.last and reasoning_content) %}
45
- {{- '<|im_start|>' + message.role + '\n<think>\n' + reasoning_content.strip('\n') + '\n</think>\n\n' + content.lstrip('\n') }}
46
- {%- else %}
47
- {{- '<|im_start|>' + message.role + '\n' + content }}
48
- {%- endif %}
49
- {%- else %}
50
- {{- '<|im_start|>' + message.role + '\n' + content }}
51
- {%- endif %}
52
- {%- if message.tool_calls %}
53
- {%- for tool_call in message.tool_calls %}
54
- {%- if (loop.first and content) or (not loop.first) %}
55
- {{- '\n' }}
56
- {%- endif %}
57
- {%- if tool_call.function %}
58
- {%- set tool_call = tool_call.function %}
59
- {%- endif %}
60
- {{- '<tool_call>\n{"name": "' }}
61
- {{- tool_call.name }}
62
- {{- '", "arguments": ' }}
63
- {%- if tool_call.arguments is string %}
64
- {{- tool_call.arguments }}
65
- {%- else %}
66
- {{- tool_call.arguments | tojson }}
67
- {%- endif %}
68
- {{- '}\n</tool_call>' }}
69
- {%- endfor %}
70
- {%- endif %}
71
- {{- '<|im_end|>\n' }}
72
- {%- elif message.role == "tool" %}
73
- {%- if loop.first or (messages[loop.index0 - 1].role != "tool") %}
74
- {{- '<|im_start|>user' }}
75
- {%- endif %}
76
- {{- '\n<tool_response>\n' }}
77
- {{- content }}
78
- {{- '\n</tool_response>' }}
79
- {%- if loop.last or (messages[loop.index0 + 1].role != "tool") %}
80
- {{- '<|im_end|>\n' }}
81
- {%- endif %}
82
- {%- endif %}
83
- {%- endfor %}
84
- {%- if add_generation_prompt %}
85
- {{- '<|im_start|>assistant\n' }}
86
- {%- if enable_thinking is defined and enable_thinking is false %}
87
- {{- '<think>\n\n</think>\n\n' }}
88
- {%- endif %}
89
- {%- endif %}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-900/optimizer.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:fca3a6b6926e387ce5e8867917b7977287b1abf00aeb93d66de9fe91a4b24081
3
- size 175019258
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-900/rng_state.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:3a5e2e570ef212d0b674ff90b61d587dbff40e569cadb167a64af276f7f11bc7
3
- size 14244
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-900/scheduler.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:9977e0a9717c002babb72ef706701cc0854ceb0f70cd11e46964e9964a47741d
3
- size 1064
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-900/tokenizer.json DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:be75606093db2094d7cd20f3c2f385c212750648bd6ea4fb2bf507a6a4c55506
3
- size 11422650
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-900/tokenizer_config.json DELETED
@@ -1,29 +0,0 @@
1
- {
2
- "add_prefix_space": false,
3
- "backend": "tokenizers",
4
- "bos_token": null,
5
- "clean_up_tokenization_spaces": false,
6
- "eos_token": "<|im_end|>",
7
- "errors": "replace",
8
- "extra_special_tokens": [
9
- "<|im_start|>",
10
- "<|im_end|>",
11
- "<|object_ref_start|>",
12
- "<|object_ref_end|>",
13
- "<|box_start|>",
14
- "<|box_end|>",
15
- "<|quad_start|>",
16
- "<|quad_end|>",
17
- "<|vision_start|>",
18
- "<|vision_end|>",
19
- "<|vision_pad|>",
20
- "<|image_pad|>",
21
- "<|video_pad|>"
22
- ],
23
- "is_local": true,
24
- "model_max_length": 131072,
25
- "pad_token": "<|endoftext|>",
26
- "split_special_tokens": false,
27
- "tokenizer_class": "Qwen2Tokenizer",
28
- "unk_token": null
29
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-900/trainer_state.json DELETED
@@ -1,502 +0,0 @@
1
- {
2
- "best_global_step": 900,
3
- "best_metric": 0.1760927140712738,
4
- "best_model_checkpoint": "/scr/user/kevin2002/TensorCat/NLP/UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-900",
5
- "epoch": 9.0,
6
- "eval_steps": 500,
7
- "global_step": 900,
8
- "is_hyper_param_search": false,
9
- "is_local_process_zero": true,
10
- "is_world_process_zero": true,
11
- "log_history": [
12
- {
13
- "entropy": 1.4358372974395752,
14
- "epoch": 0.25,
15
- "grad_norm": 0.14446501433849335,
16
- "learning_rate": 7.999671154713278e-05,
17
- "loss": 2.3676884460449217,
18
- "mean_token_accuracy": 0.5813838094472885,
19
- "num_tokens": 160725.0,
20
- "step": 25
21
- },
22
- {
23
- "entropy": 1.879828963279724,
24
- "epoch": 0.5,
25
- "grad_norm": 0.15517809987068176,
26
- "learning_rate": 7.982727278231343e-05,
27
- "loss": 1.7838900756835938,
28
- "mean_token_accuracy": 0.6484150147438049,
29
- "num_tokens": 327066.0,
30
- "step": 50
31
- },
32
- {
33
- "entropy": 1.4648912394046782,
34
- "epoch": 0.75,
35
- "grad_norm": 0.1660589873790741,
36
- "learning_rate": 7.940216640438628e-05,
37
- "loss": 1.4690559387207032,
38
- "mean_token_accuracy": 0.7019884788990021,
39
- "num_tokens": 490539.0,
40
- "step": 75
41
- },
42
- {
43
- "entropy": 1.3251829946041107,
44
- "epoch": 1.0,
45
- "grad_norm": 0.2699568569660187,
46
- "learning_rate": 7.872412134569766e-05,
47
- "loss": 1.312823028564453,
48
- "mean_token_accuracy": 0.726642736196518,
49
- "num_tokens": 656891.0,
50
- "step": 100
51
- },
52
- {
53
- "epoch": 1.0,
54
- "eval_entropy": 1.1702604523071876,
55
- "eval_loss": 1.1601083278656006,
56
- "eval_mean_token_accuracy": 0.7461812725433936,
57
- "eval_num_tokens": 656891.0,
58
- "eval_runtime": 14.1848,
59
- "eval_samples_per_second": 7.05,
60
- "eval_steps_per_second": 0.916,
61
- "step": 100
62
- },
63
- {
64
- "entropy": 0.9866749036312104,
65
- "epoch": 1.25,
66
- "grad_norm": 0.41134113073349,
67
- "learning_rate": 7.779749025581717e-05,
68
- "loss": 0.994763412475586,
69
- "mean_token_accuracy": 0.777331509590149,
70
- "num_tokens": 820900.0,
71
- "step": 125
72
- },
73
- {
74
- "entropy": 0.901508281826973,
75
- "epoch": 1.5,
76
- "grad_norm": 0.48528075218200684,
77
- "learning_rate": 7.662822156009336e-05,
78
- "loss": 0.903388442993164,
79
- "mean_token_accuracy": 0.8035100996494293,
80
- "num_tokens": 983751.0,
81
- "step": 150
82
- },
83
- {
84
- "entropy": 0.7128595209121704,
85
- "epoch": 1.75,
86
- "grad_norm": 0.5612214207649231,
87
- "learning_rate": 7.522382127426952e-05,
88
- "loss": 0.6967535400390625,
89
- "mean_token_accuracy": 0.8427894067764282,
90
- "num_tokens": 1148624.0,
91
- "step": 175
92
- },
93
- {
94
- "entropy": 0.5692075723409653,
95
- "epoch": 2.0,
96
- "grad_norm": 0.5570225715637207,
97
- "learning_rate": 7.35933048202875e-05,
98
- "loss": 0.5440200424194336,
99
- "mean_token_accuracy": 0.8759966826438904,
100
- "num_tokens": 1313782.0,
101
- "step": 200
102
- },
103
- {
104
- "epoch": 2.0,
105
- "eval_entropy": 0.6419096955886254,
106
- "eval_loss": 0.600500226020813,
107
- "eval_mean_token_accuracy": 0.861496246778048,
108
- "eval_num_tokens": 1313782.0,
109
- "eval_runtime": 14.1469,
110
- "eval_samples_per_second": 7.069,
111
- "eval_steps_per_second": 0.919,
112
- "step": 200
113
- },
114
- {
115
- "entropy": 0.44877232432365416,
116
- "epoch": 2.25,
117
- "grad_norm": 0.5958295464515686,
118
- "learning_rate": 7.174713915259331e-05,
119
- "loss": 0.41493446350097657,
120
- "mean_token_accuracy": 0.9032380354404449,
121
- "num_tokens": 1480714.0,
122
- "step": 225
123
- },
124
- {
125
- "entropy": 0.4503101620078087,
126
- "epoch": 2.5,
127
- "grad_norm": 0.7803889513015747,
128
- "learning_rate": 6.969717556645995e-05,
129
- "loss": 0.42063777923583984,
130
- "mean_token_accuracy": 0.9064690721035004,
131
- "num_tokens": 1645148.0,
132
- "step": 250
133
- },
134
- {
135
- "entropy": 0.3513291063904762,
136
- "epoch": 2.75,
137
- "grad_norm": 0.5489973425865173,
138
- "learning_rate": 6.745657361965803e-05,
139
- "loss": 0.32174919128417967,
140
- "mean_token_accuracy": 0.9250416386127472,
141
- "num_tokens": 1805051.0,
142
- "step": 275
143
- },
144
- {
145
- "entropy": 0.3790210232138634,
146
- "epoch": 3.0,
147
- "grad_norm": 0.9119548797607422,
148
- "learning_rate": 6.503971665585243e-05,
149
- "loss": 0.3341722106933594,
150
- "mean_token_accuracy": 0.9239817559719086,
151
- "num_tokens": 1970673.0,
152
- "step": 300
153
- },
154
- {
155
- "epoch": 3.0,
156
- "eval_entropy": 0.4204630897595332,
157
- "eval_loss": 0.38708260655403137,
158
- "eval_mean_token_accuracy": 0.9079863979266241,
159
- "eval_num_tokens": 1970673.0,
160
- "eval_runtime": 14.1106,
161
- "eval_samples_per_second": 7.087,
162
- "eval_steps_per_second": 0.921,
163
- "step": 300
164
- },
165
- {
166
- "entropy": 0.2572793909907341,
167
- "epoch": 3.25,
168
- "grad_norm": 0.4237155020236969,
169
- "learning_rate": 6.2462119472015e-05,
170
- "loss": 0.20618080139160155,
171
- "mean_token_accuracy": 0.9494317126274109,
172
- "num_tokens": 2133206.0,
173
- "step": 325
174
- },
175
- {
176
- "entropy": 0.29035701289772986,
177
- "epoch": 3.5,
178
- "grad_norm": 0.6824076175689697,
179
- "learning_rate": 5.974032872257388e-05,
180
- "loss": 0.25118282318115237,
181
- "mean_token_accuracy": 0.9438021230697632,
182
- "num_tokens": 2297449.0,
183
- "step": 350
184
- },
185
- {
186
- "entropy": 0.23607211165130138,
187
- "epoch": 3.75,
188
- "grad_norm": 0.8003197908401489,
189
- "learning_rate": 5.68918166996464e-05,
190
- "loss": 0.19911937713623046,
191
- "mean_token_accuracy": 0.9537552082538605,
192
- "num_tokens": 2462390.0,
193
- "step": 375
194
- },
195
- {
196
- "entropy": 0.23902728497982026,
197
- "epoch": 4.0,
198
- "grad_norm": 0.8474582433700562,
199
- "learning_rate": 5.393486917122353e-05,
200
- "loss": 0.20467203140258788,
201
- "mean_token_accuracy": 0.9515939724445343,
202
- "num_tokens": 2627564.0,
203
- "step": 400
204
- },
205
- {
206
- "epoch": 4.0,
207
- "eval_entropy": 0.31223052740097046,
208
- "eval_loss": 0.2847066819667816,
209
- "eval_mean_token_accuracy": 0.9322063556084266,
210
- "eval_num_tokens": 2627564.0,
211
- "eval_runtime": 13.9402,
212
- "eval_samples_per_second": 7.174,
213
- "eval_steps_per_second": 0.933,
214
- "step": 400
215
- },
216
- {
217
- "entropy": 0.17765841275453567,
218
- "epoch": 4.25,
219
- "grad_norm": 0.5740338563919067,
220
- "learning_rate": 5.088846799731885e-05,
221
- "loss": 0.13823826789855956,
222
- "mean_token_accuracy": 0.9671606945991517,
223
- "num_tokens": 2789214.0,
224
- "step": 425
225
- },
226
- {
227
- "entropy": 0.18791945070028304,
228
- "epoch": 4.5,
229
- "grad_norm": 0.30488306283950806,
230
- "learning_rate": 4.7772169277617086e-05,
231
- "loss": 0.14581723213195802,
232
- "mean_token_accuracy": 0.9664597606658936,
233
- "num_tokens": 2955470.0,
234
- "step": 450
235
- },
236
- {
237
- "entropy": 0.18473084963858127,
238
- "epoch": 4.75,
239
- "grad_norm": 0.5409578084945679,
240
- "learning_rate": 4.4605977812842384e-05,
241
- "loss": 0.15243392944335937,
242
- "mean_token_accuracy": 0.9648605918884278,
243
- "num_tokens": 3119188.0,
244
- "step": 475
245
- },
246
- {
247
- "entropy": 0.16782964013516902,
248
- "epoch": 5.0,
249
- "grad_norm": 0.6274464726448059,
250
- "learning_rate": 4.141021868573054e-05,
251
- "loss": 0.13563241958618164,
252
- "mean_token_accuracy": 0.9677622270584106,
253
- "num_tokens": 3284455.0,
254
- "step": 500
255
- },
256
- {
257
- "epoch": 5.0,
258
- "eval_entropy": 0.24806818537987196,
259
- "eval_loss": 0.23999404907226562,
260
- "eval_mean_token_accuracy": 0.94236238186176,
261
- "eval_num_tokens": 3284455.0,
262
- "eval_runtime": 13.8607,
263
- "eval_samples_per_second": 7.215,
264
- "eval_steps_per_second": 0.938,
265
- "step": 500
266
- },
267
- {
268
- "entropy": 0.14203706838190555,
269
- "epoch": 5.25,
270
- "grad_norm": 0.36970171332359314,
271
- "learning_rate": 3.820540678597942e-05,
272
- "loss": 0.11182730674743652,
273
- "mean_token_accuracy": 0.9730106520652771,
274
- "num_tokens": 3449400.0,
275
- "step": 525
276
- },
277
- {
278
- "entropy": 0.14063048042356968,
279
- "epoch": 5.5,
280
- "grad_norm": 0.4689595401287079,
281
- "learning_rate": 3.5012115116750614e-05,
282
- "loss": 0.10328823089599609,
283
- "mean_token_accuracy": 0.9750873637199402,
284
- "num_tokens": 3613152.0,
285
- "step": 550
286
- },
287
- {
288
- "entropy": 0.1214561627060175,
289
- "epoch": 5.75,
290
- "grad_norm": 0.6624268293380737,
291
- "learning_rate": 3.185084272811698e-05,
292
- "loss": 0.10185833930969239,
293
- "mean_token_accuracy": 0.9768549478054047,
294
- "num_tokens": 3776158.0,
295
- "step": 575
296
- },
297
- {
298
- "entropy": 0.12324205733835697,
299
- "epoch": 6.0,
300
- "grad_norm": 0.41641563177108765,
301
- "learning_rate": 2.8741883125245267e-05,
302
- "loss": 0.09359997749328614,
303
- "mean_token_accuracy": 0.9770605981349945,
304
- "num_tokens": 3941346.0,
305
- "step": 600
306
- },
307
- {
308
- "epoch": 6.0,
309
- "eval_entropy": 0.19075566071730393,
310
- "eval_loss": 0.212307408452034,
311
- "eval_mean_token_accuracy": 0.9502005072740408,
312
- "eval_num_tokens": 3941346.0,
313
- "eval_runtime": 13.9707,
314
- "eval_samples_per_second": 7.158,
315
- "eval_steps_per_second": 0.931,
316
- "step": 600
317
- },
318
- {
319
- "entropy": 0.12877136506140233,
320
- "epoch": 6.25,
321
- "grad_norm": 0.2692393362522125,
322
- "learning_rate": 2.5705193996055977e-05,
323
- "loss": 0.1031882667541504,
324
- "mean_token_accuracy": 0.9761876916885376,
325
- "num_tokens": 4106933.0,
326
- "step": 625
327
- },
328
- {
329
- "entropy": 0.08486215136945248,
330
- "epoch": 6.5,
331
- "grad_norm": 0.3272198438644409,
332
- "learning_rate": 2.2760269094631983e-05,
333
- "loss": 0.056387810707092284,
334
- "mean_token_accuracy": 0.9854865920543671,
335
- "num_tokens": 4268402.0,
336
- "step": 650
337
- },
338
- {
339
- "entropy": 0.11242001455277205,
340
- "epoch": 6.75,
341
- "grad_norm": 0.6421979665756226,
342
- "learning_rate": 1.992601310280891e-05,
343
- "loss": 0.09050872802734375,
344
- "mean_token_accuracy": 0.9787377977371216,
345
- "num_tokens": 4434736.0,
346
- "step": 675
347
- },
348
- {
349
- "entropy": 0.0798944342881441,
350
- "epoch": 7.0,
351
- "grad_norm": 0.35506346821784973,
352
- "learning_rate": 1.7220620273261923e-05,
353
- "loss": 0.050995888710021975,
354
- "mean_token_accuracy": 0.9863569080829621,
355
- "num_tokens": 4598237.0,
356
- "step": 700
357
- },
358
- {
359
- "epoch": 7.0,
360
- "eval_entropy": 0.16236452701000068,
361
- "eval_loss": 0.19433234632015228,
362
- "eval_mean_token_accuracy": 0.9543979305487412,
363
- "eval_num_tokens": 4598237.0,
364
- "eval_runtime": 13.9752,
365
- "eval_samples_per_second": 7.156,
366
- "eval_steps_per_second": 0.93,
367
- "step": 700
368
- },
369
- {
370
- "entropy": 0.10178964871913194,
371
- "epoch": 7.25,
372
- "grad_norm": 0.26595374941825867,
373
- "learning_rate": 1.466145763312922e-05,
374
- "loss": 0.07614684581756592,
375
- "mean_token_accuracy": 0.9819281613826751,
376
- "num_tokens": 4762560.0,
377
- "step": 725
378
- },
379
- {
380
- "entropy": 0.09404424335807562,
381
- "epoch": 7.5,
382
- "grad_norm": 0.23222072422504425,
383
- "learning_rate": 1.2264953497935479e-05,
384
- "loss": 0.06552838802337646,
385
- "mean_token_accuracy": 0.9836024832725525,
386
- "num_tokens": 4927776.0,
387
- "step": 750
388
- },
389
- {
390
- "entropy": 0.05591522835195065,
391
- "epoch": 7.75,
392
- "grad_norm": 0.24831674993038177,
393
- "learning_rate": 1.0046492011490874e-05,
394
- "loss": 0.034845557212829587,
395
- "mean_token_accuracy": 0.9901663279533386,
396
- "num_tokens": 5093008.0,
397
- "step": 775
398
- },
399
- {
400
- "entropy": 0.079307572953403,
401
- "epoch": 8.0,
402
- "grad_norm": 0.18024076521396637,
403
- "learning_rate": 8.020314388756562e-06,
404
- "loss": 0.050776734352111816,
405
- "mean_token_accuracy": 0.9873624122142792,
406
- "num_tokens": 5255128.0,
407
- "step": 800
408
- },
409
- {
410
- "epoch": 8.0,
411
- "eval_entropy": 0.15024888830689284,
412
- "eval_loss": 0.1804545819759369,
413
- "eval_mean_token_accuracy": 0.9596647941149198,
414
- "eval_num_tokens": 5255128.0,
415
- "eval_runtime": 14.1896,
416
- "eval_samples_per_second": 7.047,
417
- "eval_steps_per_second": 0.916,
418
- "step": 800
419
- },
420
- {
421
- "entropy": 0.05522842925041914,
422
- "epoch": 8.25,
423
- "grad_norm": 0.2229844033718109,
424
- "learning_rate": 6.199427495639963e-06,
425
- "loss": 0.029806861877441405,
426
- "mean_token_accuracy": 0.9915253543853759,
427
- "num_tokens": 5418711.0,
428
- "step": 825
429
- },
430
- {
431
- "entropy": 0.08227874159812927,
432
- "epoch": 8.5,
433
- "grad_norm": 0.21011501550674438,
434
- "learning_rate": 4.595520352583061e-06,
435
- "loss": 0.049187426567077634,
436
- "mean_token_accuracy": 0.9874508118629456,
437
- "num_tokens": 5585074.0,
438
- "step": 850
439
- },
440
- {
441
- "entropy": 0.07059245463460684,
442
- "epoch": 8.75,
443
- "grad_norm": 0.2088802009820938,
444
- "learning_rate": 3.2188890979419772e-06,
445
- "loss": 0.04377749443054199,
446
- "mean_token_accuracy": 0.9887262201309204,
447
- "num_tokens": 5748942.0,
448
- "step": 875
449
- },
450
- {
451
- "entropy": 0.0844693697988987,
452
- "epoch": 9.0,
453
- "grad_norm": 0.47332102060317993,
454
- "learning_rate": 2.078370892848134e-06,
455
- "loss": 0.05981508731842041,
456
- "mean_token_accuracy": 0.9852988374233246,
457
- "num_tokens": 5912019.0,
458
- "step": 900
459
- },
460
- {
461
- "epoch": 9.0,
462
- "eval_entropy": 0.14602531578678352,
463
- "eval_loss": 0.1760927140712738,
464
- "eval_mean_token_accuracy": 0.9613595421497638,
465
- "eval_num_tokens": 5912019.0,
466
- "eval_runtime": 14.0785,
467
- "eval_samples_per_second": 7.103,
468
- "eval_steps_per_second": 0.923,
469
- "step": 900
470
- }
471
- ],
472
- "logging_steps": 25,
473
- "max_steps": 1000,
474
- "num_input_tokens_seen": 0,
475
- "num_train_epochs": 10,
476
- "save_steps": 500,
477
- "stateful_callbacks": {
478
- "EarlyStoppingCallback": {
479
- "args": {
480
- "early_stopping_patience": 2,
481
- "early_stopping_threshold": 0.0
482
- },
483
- "attributes": {
484
- "early_stopping_patience_counter": 0
485
- }
486
- },
487
- "TrainerControl": {
488
- "args": {
489
- "should_epoch_stop": false,
490
- "should_evaluate": false,
491
- "should_log": false,
492
- "should_save": true,
493
- "should_training_stop": false
494
- },
495
- "attributes": {}
496
- }
497
- },
498
- "total_flos": 3.106085652472627e+17,
499
- "train_batch_size": 4,
500
- "trial_name": null,
501
- "trial_params": null
502
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/checkpoint-900/training_args.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:1e28aed9c09299882a0a85d4a5e7b5f033f6f0f96c839015b54f530ff1cc1760
3
- size 5368
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/hf_dataset_dict/dataset_dict.json DELETED
@@ -1 +0,0 @@
1
- {"splits": ["train", "validation", "test"]}
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/hf_dataset_dict/test/data-00000-of-00001.arrow DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:f025159053af787b7124324d5700120792c277fbd717701fed35627723dd5c86
3
- size 787088
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/hf_dataset_dict/test/dataset_info.json DELETED
@@ -1,89 +0,0 @@
1
- {
2
- "citation": "",
3
- "description": "",
4
- "features": {
5
- "qa_id": {
6
- "dtype": "string",
7
- "_type": "Value"
8
- },
9
- "index_id": {
10
- "dtype": "string",
11
- "_type": "Value"
12
- },
13
- "question": {
14
- "dtype": "string",
15
- "_type": "Value"
16
- },
17
- "answer": {
18
- "dtype": "string",
19
- "_type": "Value"
20
- },
21
- "scope_label": {
22
- "dtype": "string",
23
- "_type": "Value"
24
- },
25
- "source_doc": {
26
- "dtype": "string",
27
- "_type": "Value"
28
- },
29
- "section": {
30
- "dtype": "string",
31
- "_type": "Value"
32
- },
33
- "subsection": {
34
- "dtype": "string",
35
- "_type": "Value"
36
- },
37
- "retrieved_kb_ids": {
38
- "feature": {
39
- "dtype": "string",
40
- "_type": "Value"
41
- },
42
- "_type": "Sequence"
43
- },
44
- "retrieved_sections": {
45
- "feature": {
46
- "dtype": "string",
47
- "_type": "Value"
48
- },
49
- "_type": "Sequence"
50
- },
51
- "retrieved_scopes": {
52
- "feature": {
53
- "dtype": "string",
54
- "_type": "Value"
55
- },
56
- "_type": "Sequence"
57
- },
58
- "prompt": [
59
- {
60
- "content": {
61
- "dtype": "string",
62
- "_type": "Value"
63
- },
64
- "role": {
65
- "dtype": "string",
66
- "_type": "Value"
67
- }
68
- }
69
- ],
70
- "completion": [
71
- {
72
- "content": {
73
- "dtype": "string",
74
- "_type": "Value"
75
- },
76
- "role": {
77
- "dtype": "string",
78
- "_type": "Value"
79
- }
80
- }
81
- ],
82
- "text": {
83
- "dtype": "string",
84
- "_type": "Value"
85
- }
86
- },
87
- "homepage": "",
88
- "license": ""
89
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/hf_dataset_dict/test/state.json DELETED
@@ -1,13 +0,0 @@
1
- {
2
- "_data_files": [
3
- {
4
- "filename": "data-00000-of-00001.arrow"
5
- }
6
- ],
7
- "_fingerprint": "936c078af06a1d62",
8
- "_format_columns": null,
9
- "_format_kwargs": {},
10
- "_format_type": null,
11
- "_output_all_columns": false,
12
- "_split": null
13
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/hf_dataset_dict/train/data-00000-of-00001.arrow DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:a886ad01c88df3805ff1754bc09af8c94c3cf72fe5908edaff92b5b70943c8c7
3
- size 6287752
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/hf_dataset_dict/train/dataset_info.json DELETED
@@ -1,89 +0,0 @@
1
- {
2
- "citation": "",
3
- "description": "",
4
- "features": {
5
- "qa_id": {
6
- "dtype": "string",
7
- "_type": "Value"
8
- },
9
- "index_id": {
10
- "dtype": "string",
11
- "_type": "Value"
12
- },
13
- "question": {
14
- "dtype": "string",
15
- "_type": "Value"
16
- },
17
- "answer": {
18
- "dtype": "string",
19
- "_type": "Value"
20
- },
21
- "scope_label": {
22
- "dtype": "string",
23
- "_type": "Value"
24
- },
25
- "source_doc": {
26
- "dtype": "string",
27
- "_type": "Value"
28
- },
29
- "section": {
30
- "dtype": "string",
31
- "_type": "Value"
32
- },
33
- "subsection": {
34
- "dtype": "string",
35
- "_type": "Value"
36
- },
37
- "retrieved_kb_ids": {
38
- "feature": {
39
- "dtype": "string",
40
- "_type": "Value"
41
- },
42
- "_type": "Sequence"
43
- },
44
- "retrieved_sections": {
45
- "feature": {
46
- "dtype": "string",
47
- "_type": "Value"
48
- },
49
- "_type": "Sequence"
50
- },
51
- "retrieved_scopes": {
52
- "feature": {
53
- "dtype": "string",
54
- "_type": "Value"
55
- },
56
- "_type": "Sequence"
57
- },
58
- "prompt": [
59
- {
60
- "content": {
61
- "dtype": "string",
62
- "_type": "Value"
63
- },
64
- "role": {
65
- "dtype": "string",
66
- "_type": "Value"
67
- }
68
- }
69
- ],
70
- "completion": [
71
- {
72
- "content": {
73
- "dtype": "string",
74
- "_type": "Value"
75
- },
76
- "role": {
77
- "dtype": "string",
78
- "_type": "Value"
79
- }
80
- }
81
- ],
82
- "text": {
83
- "dtype": "string",
84
- "_type": "Value"
85
- }
86
- },
87
- "homepage": "",
88
- "license": ""
89
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/hf_dataset_dict/train/state.json DELETED
@@ -1,13 +0,0 @@
1
- {
2
- "_data_files": [
3
- {
4
- "filename": "data-00000-of-00001.arrow"
5
- }
6
- ],
7
- "_fingerprint": "a4eeb3b4abeec226",
8
- "_format_columns": null,
9
- "_format_kwargs": {},
10
- "_format_type": null,
11
- "_output_all_columns": false,
12
- "_split": null
13
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/hf_dataset_dict/validation/data-00000-of-00001.arrow DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:f2e91442ff072666e35d8227c37e03637290a2bfbbff9b277b8fe61cff2b1862
3
- size 782200
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/hf_dataset_dict/validation/dataset_info.json DELETED
@@ -1,89 +0,0 @@
1
- {
2
- "citation": "",
3
- "description": "",
4
- "features": {
5
- "qa_id": {
6
- "dtype": "string",
7
- "_type": "Value"
8
- },
9
- "index_id": {
10
- "dtype": "string",
11
- "_type": "Value"
12
- },
13
- "question": {
14
- "dtype": "string",
15
- "_type": "Value"
16
- },
17
- "answer": {
18
- "dtype": "string",
19
- "_type": "Value"
20
- },
21
- "scope_label": {
22
- "dtype": "string",
23
- "_type": "Value"
24
- },
25
- "source_doc": {
26
- "dtype": "string",
27
- "_type": "Value"
28
- },
29
- "section": {
30
- "dtype": "string",
31
- "_type": "Value"
32
- },
33
- "subsection": {
34
- "dtype": "string",
35
- "_type": "Value"
36
- },
37
- "retrieved_kb_ids": {
38
- "feature": {
39
- "dtype": "string",
40
- "_type": "Value"
41
- },
42
- "_type": "Sequence"
43
- },
44
- "retrieved_sections": {
45
- "feature": {
46
- "dtype": "string",
47
- "_type": "Value"
48
- },
49
- "_type": "Sequence"
50
- },
51
- "retrieved_scopes": {
52
- "feature": {
53
- "dtype": "string",
54
- "_type": "Value"
55
- },
56
- "_type": "Sequence"
57
- },
58
- "prompt": [
59
- {
60
- "content": {
61
- "dtype": "string",
62
- "_type": "Value"
63
- },
64
- "role": {
65
- "dtype": "string",
66
- "_type": "Value"
67
- }
68
- }
69
- ],
70
- "completion": [
71
- {
72
- "content": {
73
- "dtype": "string",
74
- "_type": "Value"
75
- },
76
- "role": {
77
- "dtype": "string",
78
- "_type": "Value"
79
- }
80
- }
81
- ],
82
- "text": {
83
- "dtype": "string",
84
- "_type": "Value"
85
- }
86
- },
87
- "homepage": "",
88
- "license": ""
89
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/hf_dataset_dict/validation/state.json DELETED
@@ -1,13 +0,0 @@
1
- {
2
- "_data_files": [
3
- {
4
- "filename": "data-00000-of-00001.arrow"
5
- }
6
- ],
7
- "_fingerprint": "6cb74bcfac21e0ef",
8
- "_format_columns": null,
9
- "_format_kwargs": {},
10
- "_format_type": null,
11
- "_output_all_columns": false,
12
- "_split": null
13
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
UM_Handbook/outputs/qwen3_um_handbook_baseline2_rag_a100/trainer_runs/train_metrics.json DELETED
@@ -1,7 +0,0 @@
1
- {
2
- "train_runtime": 2492.292,
3
- "train_samples_per_second": 3.21,
4
- "train_steps_per_second": 0.401,
5
- "total_flos": 3.4511362480123085e+17,
6
- "train_loss": 0.35718383276462556
7
- }