TencentCloudADPDevRel committed
Commit f800ccd · 1 Parent(s): 54d2988

Upload Youtu-LLM-2B model with LFS assets

.gitattributes CHANGED
@@ -4,6 +4,7 @@
  *.bz2 filter=lfs diff=lfs merge=lfs -text
  *.ckpt filter=lfs diff=lfs merge=lfs -text
  *.ftz filter=lfs diff=lfs merge=lfs -text
+ *.gguf filter=lfs diff=lfs merge=lfs -text
  *.gz filter=lfs diff=lfs merge=lfs -text
  *.h5 filter=lfs diff=lfs merge=lfs -text
  *.joblib filter=lfs diff=lfs merge=lfs -text
@@ -33,3 +34,9 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
  *.zip filter=lfs diff=lfs merge=lfs -text
  *.zst filter=lfs diff=lfs merge=lfs -text
  *tfevents* filter=lfs diff=lfs merge=lfs -text
+ *.png filter=lfs diff=lfs merge=lfs -text
+ *.jpg filter=lfs diff=lfs merge=lfs -text
+ *.jpeg filter=lfs diff=lfs merge=lfs -text
+ *.gif filter=lfs diff=lfs merge=lfs -text
+ *.svg filter=lfs diff=lfs merge=lfs -text
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
LICENSE.txt ADDED
@@ -0,0 +1,66 @@
+ Tencent is pleased to support the community by making Youtu-LLM available.
+
+ Copyright (C) 2025 Tencent. All rights reserved. Youtu-LLM IS NOT INTENDED FOR USE WITHIN THE EUROPEAN UNION.
+
+ Youtu-LLM is licensed under the License Terms of Youtu-LLM except for the third-party components listed below, which is licensed under different terms. Youtu-LLM does not impose any additional limitations beyond what is outlined in the respective licenses of these third-party components. Users must comply with all terms and conditions of original licenses of these third-party components and must ensure that the usage of the third party components adheres to all relevant laws and regulations.
+
+ For avoidance of doubts, Youtu-LLM refers to the inference enabling code, parameters and weights made publicly available by Tencent in accordance with the License Terms of Youtu-LLM in this repository.
+
+ Terms of the License Terms of Youtu-LLM:
+ --------------------------------------------------------------------
+
+ TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
+ 0. Additional Territorial Limitation
+
+ *Youtu-LLM IS NOT INTENDED FOR USE WITHIN THE EUROPEAN UNION.*
+ IN THE EVENT OF ANY CONFLICT, THIS CLAUSE SHALL PREVAIL.
+
+ 1. Definitions.
+
+ "License" shall mean the terms and conditions for use, reproduction, and distribution as defined by Sections 1 through 9 of this document.
+
+ "Licensor" shall mean the copyright owner or entity authorized by the copyright owner that is granting the License.
+
+ "Legal Entity" shall mean the union of the acting entity and all other entities that control, are controlled by, or are under common control with that entity. For the purposes of this definition, "control" means (i) the power, direct or indirect, to cause the direction or management of such entity, whether by contract or otherwise, or (ii) ownership of fifty percent (50%) or more of the outstanding shares, or (iii) beneficial ownership of such entity.
+
+ "You" (or "Your") shall mean an individual or Legal Entity exercising permissions granted by this License.
+
+ "Source" form shall mean the preferred form for making modifications, including but not limited to software source code, documentation source, and configuration files.
+
+ "Object" form shall mean any form resulting from mechanical transformation or translation of a Source form, including but not limited to compiled object code, generated documentation, and conversions to other media types.
+
+ "Work" shall mean the work of authorship, whether in Source or Object form, made available under the License, as indicated by a copyright notice that is included in or attached to the work (an example is provided in the Appendix below).
+
+ "Derivative Works" shall mean any work, whether in Source or Object form, that is based on (or derived from) the Work and for which the editorial revisions, annotations, elaborations, or other modifications represent, as a whole, an original work of authorship. For the purposes of this License, Derivative Works shall not include works that remain separable from, or merely link (or bind by name) to the interfaces of, the Work and Derivative Works thereof.
+
+ "Contribution" shall mean any work of authorship, including the original version of the Work and any modifications or additions to that Work or Derivative Works thereof, that is intentionally submitted to Licensor for inclusion in the Work by the copyright owner or by an individual or Legal Entity authorized to submit on behalf of the copyright owner. For the purposes of this definition, "submitted" means any form of electronic, verbal, or written communication sent to the Licensor or its representatives, including but not limited to communication on electronic mailing lists, source code control systems, and issue tracking systems that are managed by, or on behalf of, the Licensor for the purpose of discussing and improving the Work, but excluding communication that is conspicuously marked or otherwise designated in writing by the copyright owner as "Not a Contribution."
+
+ "Contributor" shall mean Licensor and any individual or Legal Entity on behalf of whom a Contribution has been received by Licensor and subsequently incorporated within the Work.
+
+ 2. Grant of Copyright License. Subject to the terms and conditions of this License, each Contributor hereby grants to You a perpetual, worldwide, non-exclusive, no-charge, royalty-free, irrevocable copyright license to reproduce, prepare Derivative Works of, publicly display, publicly perform, sublicense, and distribute the Work and such Derivative Works in Source or Object form.
+
+ 3. Grant of Patent License. Subject to the terms and conditions of this License, each Contributor hereby grants to You a perpetual, worldwide, non-exclusive, no-charge, royalty-free, irrevocable (except as stated in this section) patent license to make, have made, use, offer to sell, sell, import, and otherwise transfer the Work, where such license applies only to those patent claims licensable by such Contributor that are necessarily infringed by their Contribution(s) alone or by combination of their Contribution(s) with the Work to which such Contribution(s) was submitted. If You institute patent litigation against any entity (including a cross-claim or counterclaim in a lawsuit) alleging that the Work or a Contribution incorporated within the Work constitutes direct or contributory patent infringement, then any patent licenses granted to You under this License for that Work shall terminate as of the date such litigation is filed.
+
+ 4. Redistribution. You may reproduce and distribute copies of the Work or Derivative Works thereof in any medium, with or without modifications, and in Source or Object form, provided that You meet the following conditions:
+
+ You must give any other recipients of the Work or Derivative Works a copy of this License; and
+
+ You must cause any modified files to carry prominent notices stating that You changed the files; and
+
+ You must retain, in the Source form of any Derivative Works that You distribute, all copyright, patent, trademark, and attribution notices from the Source form of the Work, excluding those notices that do not pertain to any part of the Derivative Works; and
+
+ If the Work includes a "NOTICE" text file as part of its distribution, then any Derivative Works that You distribute must include a readable copy of the attribution notices contained within such NOTICE file, excluding those notices that do not pertain to any part of the Derivative Works, in at least one of the following places: within a NOTICE text file distributed as part of the Derivative Works; within the Source form or documentation, if provided along with the Derivative Works; or, within a display generated by the Derivative Works, if and wherever such third-party notices normally appear. The contents of the NOTICE file are for informational purposes only and do not modify the License. You may add Your own attribution notices within Derivative Works that You distribute, alongside or as an addendum to the NOTICE text from the Work, provided that such additional attribution notices cannot be construed as modifying the License.
+
+ You may add Your own copyright statement to Your modifications and may provide additional or different license terms and conditions for use, reproduction, or distribution of Your modifications, or for any such Derivative Works as a whole, provided Your use, reproduction, and distribution of the Work otherwise complies with the conditions stated in this License.
+
+ 5. Submission of Contributions. Unless You explicitly state otherwise, any Contribution intentionally submitted for inclusion in the Work by You to the Licensor shall be under the terms and conditions of this License, without any additional terms or conditions. Notwithstanding the above, nothing herein shall supersede or modify the terms of any separate license agreement you may have executed with Licensor regarding such Contributions.
+
+ 6. Trademarks. This License does not grant permission to use the trade names, trademarks, service marks, or product names of the Licensor, except as required for reasonable and customary use in describing the origin of the Work and reproducing the content of the NOTICE file.
+
+ 7. Disclaimer of Warranty. Unless required by applicable law or agreed to in writing, Licensor provides the Work (and each Contributor provides its Contributions) on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied, including, without limitation, any warranties or conditions of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A PARTICULAR PURPOSE. You are solely responsible for determining the appropriateness of using or redistributing the Work and assume any risks associated with Your exercise of permissions under this License.
+
+ 8. Limitation of Liability. In no event and under no legal theory, whether in tort (including negligence), contract, or otherwise, unless required by applicable law (such as deliberate and grossly negligent acts) or agreed to in writing, shall any Contributor be liable to You for damages, including any direct, indirect, special, incidental, or consequential damages of any character arising as a result of this License or out of the use or inability to use the Work (including but not limited to damages for loss of goodwill, work stoppage, computer failure or malfunction, or any and all other commercial damages or losses), even if such Contributor has been advised of the possibility of such damages.
+
+ 9. Accepting Warranty or Additional Liability. While redistributing the Work or Derivative Works thereof, You may choose to offer, and charge a fee for, acceptance of support, warranty, indemnity, or other liability obligations and/or rights consistent with this License. However, in accepting such obligations, You may act only on Your own behalf and on Your sole responsibility, not on behalf of any other Contributor, and only if You agree to indemnify, defend, and hold each Contributor harmless for any liability incurred by, or claims asserted against, such Contributor by reason of your accepting any such warranty or additional liability.
+
+ END OF TERMS AND CONDITIONS
README.md ADDED
@@ -0,0 +1,238 @@
+ ---
+ library_name: transformers
+ license: other
+ license_link: https://huggingface.co/tencent/Youtu-LLM-2B/LICENSE.txt
+ pipeline_tag: text-generation
+ base_model:
+ - tencent/Youtu-LLM-2B-Base
+ ---
+
+ <div align="center">
+
+ # <img src="assets/youtu-llm-logo.png" alt="Tencent Youtu Lab Logo" height="26px">
+
+ # <img src="assets/general_agentic_instruct.png" alt="Comparison between Youtu-LLM-2B and baselines" height="260px">
+
+ [📃 License](LICENSE.txt) • [💻 Code](https://github.com/TencentCloudADP/youtu-tip/youtu-llm) • [📑 Technical Report](https://github.com/TencentCloudADP/youtu-tip/youtu-llm/assets/Youtu-LLM_Technical_Report.pdf) • [📊 Benchmarks](#benchmarks) • [🚀 Getting Started](#quickstart) • [💡 Highlights](#highlights)
+
+ </div>
+
+ ## 🎯 Brief Introduction
+
+ **Youtu-LLM** is a new, small, yet powerful LLM: it contains only 1.96B parameters, supports a 128K-token context, and has native agentic abilities. On general evaluations, Youtu-LLM significantly outperforms SOTA LLMs of similar size in Commonsense, STEM, Coding, and Long Context capabilities; on agent-related benchmarks, it surpasses larger leading models and can complete multiple end-to-end agent tasks.
+
+ **Youtu-LLM** has the following features (a quick way to verify them from the published config follows this list):
+ - Type: Autoregressive Causal Language Model with Dense [MLA](https://arxiv.org/abs/2405.04434)
+ - Release versions: [Base](https://huggingface.co/tencent/Youtu-LLM-2B-Base) and [Instruct](https://huggingface.co/tencent/Youtu-LLM-2B)
+ - Number of Parameters: 1.96B
+ - Number of Layers: 32
+ - Number of Attention Heads (MLA): 16 for Q/K/V
+ - MLA Rank: 1,536 for Q, 512 for K/V
+ - MLA Dim: 128 for QK Nope, 64 for QK Rope, and 128 for V
+ - Context Length: 131,072
+ - Vocabulary Size: 128,256
+
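+ A minimal sketch for cross-checking these settings locally; the exact field names come from the model's custom configuration class, so treat them as assumptions:
+
+ ```python
+ # Inspect the advertised architecture without downloading the weights.
+ from transformers import AutoConfig
+
+ config = AutoConfig.from_pretrained("tencent/Youtu-LLM-2B", trust_remote_code=True)
+ print(config)  # expect 32 layers, vocab_size=128256, and a 131,072-token context window
+ ```
+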
+ <a id="benchmarks"></a>
+
+ ## 📊 Performance Comparisons
+
+ ### Instruct Model
+ #### General Benchmarks
+ | Benchmark | DeepSeek-R1-Distill-Qwen-1.5B | Qwen3-1.7B | SmolLM3-3B | Qwen3-4B | DeepSeek-R1-Distill-Llama-8B | Youtu-LLM-2B |
+ | :--- | :---: | :---: | :---: | :---: | :---: | :---: |
+ | **Commonsense Knowledge Reasoning** | | | | | | |
+ | MMLU-Redux | 53.0% | 74.1% | 75.6% | **83.8%** | <u>78.1%</u> | 75.8% |
+ | MMLU-Pro | 36.5% | 54.9% | 53.0% | **69.1%** | 57.5% | <u>61.6%</u> |
+ | **Instruction Following & Text Reasoning** | | | | | | |
+ | IFEval | 29.4% | 70.4% | 60.4% | **83.6%** | 34.6% | <u>81.2%</u> |
+ | DROP | 41.3% | 72.5% | 72.0% | <u>82.9%</u> | 73.1% | **86.7%** |
+ | MUSR | 43.8% | 56.6% | 54.1% | **60.5%** | <u>59.7%</u> | 57.4% |
+ | **STEM** | | | | | | |
+ | MATH-500 | 84.8% | 89.8% | 91.8% | **95.0%** | 90.8% | <u>93.7%</u> |
+ | AIME 24 | 30.2% | 44.2% | 46.7% | **73.3%** | 52.5% | <u>65.4%</u> |
+ | AIME 25 | 23.1% | 37.1% | 34.2% | **64.2%** | 34.4% | <u>49.8%</u> |
+ | GPQA-Diamond | 33.6% | 36.9% | 43.8% | **55.2%** | 45.5% | <u>48.0%</u> |
+ | BBH | 31.0% | 69.1% | 76.3% | **87.8%** | <u>77.8%</u> | 77.5% |
+ | **Coding** | | | | | | |
+ | HumanEval | 64.0% | 84.8% | 79.9% | <u>95.4%</u> | 88.1% | **95.9%** |
+ | HumanEval+ | 59.5% | 76.2% | 74.7% | <u>87.8%</u> | 82.5% | **89.0%** |
+ | MBPP | 51.5% | 80.5% | 66.7% | **92.3%** | 73.9% | <u>85.0%</u> |
+ | MBPP+ | 44.2% | 67.7% | 56.7% | **77.6%** | 61.0% | <u>71.7%</u> |
+ | LiveCodeBench v6 | 19.8% | 30.7% | 30.8% | **48.5%** | 36.8% | <u>43.7%</u> |
+
+ #### Agentic Benchmarks
+ | Benchmark | Qwen3-1.7B | SmolLM3-3B | Qwen3-4B | Youtu-LLM-2B |
+ | :--- | :---: | :---: | :---: | :---: |
+ | **Deep Research** | | | | |
+ | GAIA | 11.4% | 11.7% | <u>25.5%</u> | **33.9%** |
+ | xbench | 11.7% | 13.9% | <u>18.4%</u> | **19.5%** |
+ | **Code** | | | | |
+ | SWE-Bench-Verified | 0.6% | <u>7.2%</u> | 5.7% | **17.7%** |
+ | EnConda-Bench | 10.8% | 3.5% | <u>16.1%</u> | **21.5%** |
+ | **Tool** | | | | |
+ | BFCL V3 | 55.5% | 31.5% | **61.7%** | <u>58.0%</u> |
+ | τ²-Bench | 2.6% | 9.7% | <u>10.9%</u> | **15.0%** |
+
+ <a id="quickstart"></a>
+
+ ## 🚀 Quick Start
+ This guide will help you quickly deploy and invoke the **Youtu-LLM-2B** model. The model supports a "Reasoning Mode" that lets it generate higher-quality responses through Chain of Thought (CoT).
+
+ ---
+
+ ### 1. Environment Preparation
+
+ Ensure your Python environment has the `transformers` library installed and that its version meets the requirement below.
+
+ ```bash
+ pip install "transformers>=4.56" torch accelerate
+ ```
+
+ ---
+
+ ### 2. Core Code Example
+
+ The following example demonstrates how to load the model, enable Reasoning Mode, and use the `re` module to parse the "Thought Process" and the "Final Answer" from the output.
+
+ ```python
+ import re
+ import torch
+ from transformers import AutoTokenizer, AutoModelForCausalLM
+
+ # 1. Configure Model
+ model_id = "tencent/Youtu-LLM-2B"
+
+ # 2. Initialize Tokenizer and Model
+ tokenizer = AutoTokenizer.from_pretrained(model_id, trust_remote_code=True)
+ model = AutoModelForCausalLM.from_pretrained(
+     model_id,
+     device_map="auto",
+     trust_remote_code=True
+ )
+
+ # 3. Construct Dialogue Input
+ prompt = "Hello"
+ messages = [{"role": "user", "content": prompt}]
+
+ # Use apply_chat_template to construct the input; enable_thinking=True activates Reasoning Mode
+ input_ids = tokenizer.apply_chat_template(
+     messages,
+     tokenize=True,
+     add_generation_prompt=True,
+     return_tensors="pt",
+     enable_thinking=True
+ ).to(model.device)
+
+ # 4. Generate Response
+ outputs = model.generate(
+     input_ids,
+     max_new_tokens=512,
+     do_sample=True,
+     temperature=1.0,
+     top_p=0.95,
+     repetition_penalty=1.05
+ )
+
+ # 5. Parse Results (decode only the newly generated tokens, not the echoed prompt)
+ full_response = tokenizer.decode(outputs[0][input_ids.shape[1]:], skip_special_tokens=True)
+
+ def parse_reasoning(text):
+     """Extract the thought process within <think> tags and the subsequent answer content."""
+     thought_pattern = r"<think>(.*?)</think>"
+     match = re.search(thought_pattern, text, re.DOTALL)
+
+     if match:
+         thought = match.group(1).strip()
+         answer = text.split("</think>")[-1].strip()
+     else:
+         thought = "(No explicit thought process generated)"
+         answer = text
+     return thought, answer
+
+ thought, final_answer = parse_reasoning(full_response)
+
+ print(f"\n{'='*20} Thought Process {'='*20}\n{thought}")
+ print(f"\n{'='*20} Final Answer {'='*20}\n{final_answer}")
+ ```
+
+ ---
+
+ ### 3. Key Configuration Details
+
+ #### Reasoning Mode Toggle
+
+ Controlled via the `enable_thinking` parameter of the `apply_chat_template` method (a sketch of the non-thinking path follows this list):
+
+ * **True (Recommended Default):** Activates Chain of Thought; ideal for complex logic and reasoning tasks.
+ * **False:** Outputs results directly; faster response time, suitable for simple conversations.
+
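+ A minimal sketch of the non-thinking path, reusing `tokenizer`, `model`, and `messages` from Section 2 and the Normal Mode parameters from the table below:
+
+ ```python
+ # Same pipeline as Section 2, but skip the <think> phase for a fast, direct reply.
+ input_ids = tokenizer.apply_chat_template(
+     messages,
+     tokenize=True,
+     add_generation_prompt=True,
+     return_tensors="pt",
+     enable_thinking=False  # disable Reasoning Mode
+ ).to(model.device)
+
+ outputs = model.generate(input_ids, max_new_tokens=256, do_sample=True,
+                          temperature=0.7, top_p=0.8, top_k=20)
+ print(tokenizer.decode(outputs[0][input_ids.shape[1]:], skip_special_tokens=True))
+ ```
+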
+ #### Recommended Decoding Parameters
+
+ Depending on your use case, we suggest adjusting the following hyperparameters for optimal generation (a packaging sketch follows the table):
+
+ | Parameter | Reasoning Mode | Normal Mode |
+ | --- | --- | --- |
+ | `do_sample` | `True` | `True` |
+ | `temperature` | **1.0** (Maintains creativity) | **0.7** (More stable results) |
+ | `top_p` | 0.95 | 0.8 |
+ | `top_k` | 20 | 20 |
+ | `repetition_penalty` | 1.05 | - |
+
+ > **Tip:** When using Reasoning Mode, a higher `temperature` helps the model perform deeper, more divergent thinking.
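+
+ These presets can be bundled as reusable `GenerationConfig` objects (a sketch; the variable names are arbitrary):
+
+ ```python
+ from transformers import GenerationConfig
+
+ # Presets taken from the table above.
+ reasoning_cfg = GenerationConfig(do_sample=True, temperature=1.0, top_p=0.95,
+                                  top_k=20, repetition_penalty=1.05, max_new_tokens=512)
+ normal_cfg = GenerationConfig(do_sample=True, temperature=0.7, top_p=0.8,
+                               top_k=20, max_new_tokens=512)
+
+ outputs = model.generate(input_ids, generation_config=reasoning_cfg)
+ ```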
+
+ ---
+
+ ### 4. vLLM Deployment
+
+ We provide support for deploying the model using **vLLM 0.10.2**. The recommended Docker image is `vllm/vllm-openai:v0.10.2`.
+
+ #### Integration Steps
+ First, execute the following commands to integrate the Youtu-LLM model files into the vLLM framework.
+ *Note: Please extract our provided [modified vllm zip file](https://github.com/TencentCloudADP/youtu-tip/youtu-llm/vllm_deploy/modified_vllm.zip) first. Then, replace `<local_modified_vllm_path>` with the path to the extracted vllm directory, and replace `<vllm_path>` with the installation path of vLLM.*
+
+ ```bash
+ cp <local_modified_vllm_path>/0_10_2_official/youtu_llm.py <vllm_path>/vllm/model_executor/models/youtu_llm.py
+ cp <local_modified_vllm_path>/0_10_2_official/configuration_youtu.py <vllm_path>/vllm/model_executor/models/configuration_youtu.py
+ cp <local_modified_vllm_path>/0_10_2_official/__init__.py <vllm_path>/vllm/config/__init__.py
+ cp <local_modified_vllm_path>/0_10_2_official/registry.py <vllm_path>/vllm/model_executor/models/registry.py
+ ```
+
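+ After copying the files, you can optionally smoke-test the integration offline before starting the server (a sketch using vLLM's Python API; `<model_path>` as above):
+
+ ```python
+ # Quick offline check that the patched vLLM install can load and run the model.
+ from vllm import LLM, SamplingParams
+
+ llm = LLM(model="<model_path>", trust_remote_code=True)
+ out = llm.generate(["Hello"], SamplingParams(temperature=0.7, top_p=0.8, max_tokens=64))
+ print(out[0].outputs[0].text)
+ ```
+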
+ #### Service Startup
+ Once integrated, you can deploy the model using the following command:
+
+ ```bash
+ vllm serve <model_path> --trust-remote-code
+ ```
+
+ **Tool Call Support:**
+ To enable tool calling capabilities, please append the following arguments to the startup command:
+
+ ```bash
+ --enable-auto-tool-choice --tool-call-parser hermes
+ ```
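+
+ With the server running, tool calls go through vLLM's OpenAI-compatible API. Below is a minimal sketch using the `openai` Python client; the port, the served model name, and the `get_weather` tool are illustrative assumptions:
+
+ ```python
+ # Hypothetical smoke test for tool calling against a local vLLM server.
+ from openai import OpenAI
+
+ client = OpenAI(base_url="http://localhost:8000/v1", api_key="EMPTY")
+ tools = [{
+     "type": "function",
+     "function": {
+         "name": "get_weather",  # made-up example tool
+         "description": "Get the current weather for a city",
+         "parameters": {
+             "type": "object",
+             "properties": {"city": {"type": "string"}},
+             "required": ["city"],
+         },
+     },
+ }]
+ resp = client.chat.completions.create(
+     model="<model_path>",  # the name under which `vllm serve` registered the model
+     messages=[{"role": "user", "content": "What's the weather in Shenzhen?"}],
+     tools=tools,
+ )
+ print(resp.choices[0].message.tool_calls)  # parsed by --tool-call-parser hermes
+ ```
+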
+ ---
+
+ <a id="highlights"></a>
+
+ ## 💡 Highlights
+ ### Showcase of General Tasks
+
+ | User's query | Youtu-LLM-2B's response |
+ |---------|---------|
+ | 根据《个人信息保护法》,以下哪种措施是处理个人信息时必须遵循的原则以保护用户隐私权?<br>A:数据加密,确保个人信息在传输和存储时的安全<br>B:尽可能收集和保存用户的全部信息,以便提供更个性化的服务<br>C:公开所有收集的个人信息,让用户自行决定是否接受<br>D:未经用户同意,将个人信息转移给第三方 | 根据《个人信息保护法》的相关规定,处理个人信息时必须遵循的原则以保护用户隐私权,需结合法律的具体条款进行分析。<br>---<br>### **选项分析**<br>**A. 数据加密,确保个人信息在传输和存储时的安全** <br>《个人信息保护法》第二十一条明确规定:“处理者应当采取技术措施和其他必要措施,确保其处理的个人信息安全,防止个人信息泄露、篡改、丢失。” <br>数据加密是实现安全保障的重要技术手段,属于法律要求的**具体措施**,但其本质是落实“安全保障义务”这一原则。虽然“安全保障义务”是法律原则之一,但“数据加密”本身是该原则下的**具体操作手段**。 <br>**结论**:该选项符合法律对个人信息安全的强制性要求,是保护用户隐私权的重要措施。<br>**B. 尽可能收集和保存用户的全部信息,以便提供更个性化的服务** <br>《个人信息保护法》第十五条明确规��:“处理个人信息应当具有明确、合理的目的,并应当与处理目的直接相关,采取对个人权益影响最小的方式。” <br>“最小必要原则”是法律的核心原则之一,要求**仅收集与处理目的直接相关的信息**,而非“尽可能收集和保存全部信息”。 <br>**结论**:该选项明显违反“最小必要原则”,属于错误做法。<br>**C. 公开所有收集的个人信息,让用户自行决定是否接受** <br>《个人信息保护法》第十四条规定:“处理个人信息应当公开处理规则,明示处理目的、方式及范围。” <br>法律要求的是**公开处理规则**,而非“公开所有个人信息”。用户有权了解其信息被如何使用,但“公开所有信息”并非法定要求,且可能涉及过度收集。 <br>**结论**:该选项表述不准确,不符合法律规定。<br>**D. 未经用户同意,将个人信息转移给第三方** <br>《个人信息保护法》第十条明确规定:“处理个人信息应当取得个人同意;法律、行政法规另有规定的除外。” <br>未经用户同意转移个人信息属于违法行为,严重侵犯用户隐私权。 <br>**结论**:该选项明显违反法律,属于错误做法。<br>---<br>### **核心原则与选项对应**<br>《个人信息保护法》的核心原则包括: <br>1. **合法、正当、必要、诚信原则**(第十三条、第十四条) <br>2. **最小必要原则**(第十五条) <br>3. **公开透明原则**(第十四条) <br>4. **安全保障义务**(第二十一条) <br>其中,**安全保障义务**要求处理者采取必要措施保障个人信息安全,包括数据加密等具体技术手段。因此,**数据加密是落实安全保障义务的必要措施**,属于法律明确要求的实践操作。<br>---<br>### **结论**<br>在四个选项中,**只有A项符合《个人信息保护法》对个人信息处理的要求**,是保护用户隐私权必须遵循的措施。其他选项均存在明显违法或与法律原则相悖的问题。<br>**正确答案:A** |
+ | 设总体\$X\$的分布律为<br>\begin{tabular}{\|l\|l\|l\|l\|}<br>\hline\$X\$&-1&0&2\\<br>\hline\$P\$&\$\frac{1}{3}\theta\$&\$1-\frac{2}{3}\theta\$&\$\frac{1}{3}\theta\$\\<br>\hline<br>\end{tabular}<br>\$\left(X_{1},X_{2},\cdots,X_{n}\right)\$为来自总体的样本,设有以下四个统计量<br>(i)\$\frac{3}{n}\sum_{i=1}^{n}X_{i}\$,(ii)\$\left.X_{1}+\frac{2}{n-1}\right)_{i=2}^{n}X_{i}\$,(iii)\$\frac{3}{5n}\sum_{i=1}^{n}X_{i}^{2}\$,(iv)\$\frac{1}{3n}\sum_{i=1}^{n}X_{i}^{2}\$<br>在上述四个统计量中,是参数\$\theta\$的一致估计量的个数是____<br>A:0<br>B:2<br>C:1<br>D:3 | ### 题目分析<br>我们被给出一个总体 \$ X \$ 的分布律如下:<br>\$\$<br>\begin{array}{\|l\|l\|l\|}<br>\hline<br>X & -1 & 0 & 2 \\<br>\hline<br>P & \frac{1}{3}\theta & 1 - \frac{2}{3}\theta & \frac{1}{3}\theta \\<br>\hline<br>\end{array}<br>\$\$<br>其中 \$\theta \in [0, \frac{3}{2}]\$,因为所有概率必须非负。<br>样本 \$(X_1, X_2, \ldots, X_n)\$ 来自该总体,题目要求判断以下四个统计量中哪些是参数 \$\theta\$ 的**一致估计量**。<br>---<br>### 一致估计量的定义<br>一个估计量 \$\hat{\theta}^{(n)}\$ 是参数 \$\theta\$ 的**一致估计量**,当且仅当:<br>\$\$<br>\lim_{n \to \infty} P(\|\hat{\theta}^{(n)} - \theta\| > \varepsilon) = 0 \quad \text{对任意 } \varepsilon > 0<br>\$\$<br>即:随着样本容量 \$n\$ 增大,估计量依概率收敛于真实参数 \$\theta\$。<br>通常,若估计量是**渐近无偏**的(即 \$E[\hat{\theta}^{(n)}] \to \theta\$)且满足一致方差条件,则它是一致估计量。但即使不满足这些条件,只要依概率收敛即可。<br>---<br>### 计算关键期望值<br>我们先计算一些关键矩:<br>- \$ E[X] = (-1)\cdot \frac{1}{3}\theta + 0 \cdot \left(1 - \frac{2}{3}\theta\right) + 2 \cdot \frac{1}{3}\theta = \frac{1}{3}\theta \$<br>- \$ E[X^2] = 1 \cdot \frac{1}{3}\theta + 0 + 4 \cdot \frac{1}{3}\theta = \frac{5}{3}\theta \$<br>---<br>### 逐个分析统计量<br>#### (i) \$\frac{3}{n} \sum_{i=1}^{n} X_i\$<br>- 期望: <br> \$\$<br> E\left[\frac{3}{n} \sum_{i=1}^{n} X_i\right] = \frac{3}{n} \cdot n \cdot E[X] = 3 \cdot \frac{1}{3}\theta = \theta<br> \$\$<br>- 由大数定律,\$\frac{1}{n} \sum_{i=1}^{n} X_i \xrightarrow{P} E[X] = \frac{1}{3}\theta\$, <br> 所以 \$\frac{3}{n} \sum_{i=1}^{n} X_i \xrightarrow{P} \theta\$<br>✅ **结论:(i) 是一致估计量**<br>---<br>#### (ii) \$X_1 + \frac{2}{n-1} \sum_{i=2}^{n} X_i\$<br>- 表达式可写为:<br> \$\$<br> \hat{\theta}^{(ii)} = X_1 + \frac{2}{n-1} \sum_{i=2}^{n} X_i<br> \$\$<br>- 期望:<br> \$\$<br> E[\hat{\theta}^{(ii)}] = E[X_1] + \frac{2}{n-1} \cdot (n-1) E[X] = \frac{1}{3}\theta + 2 \cdot \frac{1}{3}\theta = \theta<br> \$\$<br>- 但注意:该统计量包含 \$X_1\$,这是一个**固定随机变量**,而 \$\frac{2}{n-1} \sum_{i=2}^{n} X_i \xrightarrow{P} \frac{2}{3}\theta\$, <br> 所以整��趋于 \$X_1 + \frac{2}{3}\theta\$,而 \$X_1\$ 不是 \$\theta\$ 的函数,因此极限不唯一。<br>❌ **结论:(ii) 不是一致估计量**<br>---<br>#### (iii) \$\frac{3}{5n} \sum_{i=1}^{n} X_i^2\$<br>- 期望:<br> \$\$<br> E\left[\frac{3}{5n} \sum_{i=1}^{n} X_i^2\right] = \frac{3}{5n} \cdot n \cdot E[X^2] = \frac{3}{5} \cdot \frac{5}{3}\theta = \theta<br> \$\$<br>- 由大数定律,\$\frac{1}{n} \sum_{i=1}^{n} X_i^2 \xrightarrow{P} E[X^2] = \frac{5}{3}\theta\$, <br> 所以 \$\frac{3}{5n} \sum_{i=1}^{n} X_i^2 \xrightarrow{P} \theta\$<br>✅ **结论:(iii) 是一致估计量**<br>---<br>#### (iv) \$\frac{1}{3n} \sum_{i=1}^{n} X_i^2\$<br>- 期望:<br> \$\$<br> E\left[\frac{1}{3n} \sum_{i=1}^{n} X_i^2\right] = \frac{1}{3n} \cdot n \cdot E[X^2] = \frac{1}{3} \cdot \frac{5}{3}\theta = \frac{5}{9}\theta \neq \theta<br> \$\$<br>- 极限为 \$\frac{5}{9}\theta \neq \theta\$,故不依概率收敛于 \$\theta\$<br>❌ **结论:(iv) 不是一致估计量**<br>---<br>### 最终结论<br>- 一致估计量有:(i) 和 (iii)<br>- 共 **2 个**<br>---<br>### 答案<br>\$\$<br>\boxed{B}<br>\$\$ |
+ | Which of the following statements does NOT accurately describe voting behavior in the United States?<br>A: Registered voters between the ages of 35 and 45 are more likely to vote than are those under the age of 21.<br>B: A registered voter who has attained his or her General Educational Development (GED) is less likely to vote than a high school dropout.<br>C: Registered voters are more likely to vote in general elections than they are in primary elections.<br>D: More women than men have voted in every presidential election since 1980. | The question asks which statement does NOT accurately describe voting behavior in the United States. Here's the analysis of each option:<br>- **Option A** states that registered voters aged 35–45 are more likely to vote than those under 21. This aligns with the general trend of increasing voter turnout with age, especially in the 30s and 40s. While younger voters (e.g., under 21) may have lower turnout, this statement is accurate. <br>- **Option B** claims that a registered voter with a GED is less likely to vote than a high school dropout. This contradicts the typical correlation between higher education and increased voter participation. GED holders generally have higher turnout than those with less education, making this statement **inaccurate**. <br>- **Option C** notes that registered voters are more likely to vote in general elections than primary elections. This is correct, as primaries are party-specific and often serve as a gateway to general elections, meaning registered voters are more likely to participate in the latter. <br>- **Option D** asserts that more women than men have voted in every presidential election since 1980. Historical data shows women have consistently had slightly higher turnout rates than men in presidential elections since 1980, making this statement accurate. <br>The incorrect statement is **B**, as it misrepresents the relationship between education and voting behavior. <br>\boxed{B} |
+ | Let \$T\$ be the set of all triples \$(a,b,c)\$ of positive integers for which there exist triangles with side lengths \$a,\$ \$b,\$ \$c.\$ Compute<br>\[\sum_{(a,b,c) \in T} \frac{2^a}{3^b 5^c}.\] | To solve the problem, we need to compute the sum over all triples \((a, b, c)\) of positive integers that form a valid triangle of the term \(\frac{2^a}{3^b 5^c}\). The set \(T\) consists of all such triples where \(a + b > c\), \(a + c > b\), and \(b + c > a\).<br>First, we express the sum as a double sum over \(a\) and \(b\), with the inner sum over \(c\) constrained by the triangle inequalities. For each \(a\) and \(b\), the valid \(c\) values are \(\|a - b\| + 1\) to \(a + b - 1\). The inner sum over \(c\) is a geometric series:<br>\[<br>\sum_{c=\|a - b\| + 1}^{a + b - 1} \frac{1}{5^c} = \frac{5}{4} \left( \frac{1}{5^{\|a - b\| + 1}} - \frac{1}{5^{a + b}} \right)<br>\]<br>Substituting this back into the original sum, we split it into two parts:<br>\[<br>\frac{5}{4} \left( \sum_{a=1}^\infty \sum_{b=1}^\infty \frac{2^a}{3^b} \left( \frac{1}{5^{\|a - b\| + 1}} - \frac{1}{5^{a + b}} \right) \right)<br>\]<br>We compute these sums separately. Let \(S_1\) be the first part and \(S_2\) be the second part.<br>For \(S_2\):<br>\[<br>S_2 = \sum_{a=1}^\infty \sum_{b=1}^\infty \frac{2^a}{3^b 5^{a + b}} = \left( \sum_{a=1}^\infty \left( \frac{2}{5} \right)^a \right) \left( \sum_{b=1}^\infty \left( \frac{1}{15} \right)^b \right) = \frac{2/3}{1 - 2/5} \cdot \frac{1/15}{1 - 1/15} = \frac{2}{3} \cdot \frac{1}{14} = \frac{1}{21}<br>\]<br>For \(S_1\), we split it into two cases \(a \geq b\) and \(a < b\). For \(a \geq b\):<br>\[<br>S_{1a} = \sum_{b=1}^\infty \sum_{k=0}^\infty \frac{2^{b + k}}{3^b 5^{k + 1}} = \frac{2}{3} \sum_{b=1}^\infty \left( \frac{2}{3} \right)^b \cdot \frac{1}{5} \sum_{k=0}^\infty \left( \frac{2}{5} \right)^k = \frac{2}{3} \cdot \frac{1}{3} \cdot 2 = \frac{2}{3}<br>\]<br>For \(a < b\):<br>\[<br>S_{1b} = \sum_{a=1}^\infty \sum_{m=1}^\infty \frac{2^a}{3^{a + m} 5^{m + 1}} = \frac{1}{5 \cdot 14} \sum_{a=1}^\infty \left( \frac{2}{3} \right)^a = \frac{1}{70} \cdot 2 = \frac{1}{35}<br>\]<br>Thus, \(S_1 = S_{1a} + S_{1b} = \frac{2}{3} + \frac{1}{35} = \frac{73}{105}\).<br>Combining these results:<br>\[<br>\frac{5}{4} \left( \frac{73}{105} - \frac{1}{21} \right) = \frac{5}{4} \left( \frac{73}{105} - \frac{5}{105} \right) = \frac{5}{4} \cdot \frac{68}{105} = \frac{17}{21}<br>\]<br>The final answer is:<br>\[<br>\boxed{\dfrac{17}{21}}<br>\] |
+
+ ### Showcase of Specialized Tasks
+
+ | Task | User's query | Youtu-LLM-2B's response |
+ |---------|---------|---------|
+ | **问题改写✍️** | Q1:南京欢乐谷的具体地址是哪里<br>A1:南京市欢乐谷景区(Nanjing Happy Valley),位于江苏省南京市栖霞区经济技术开发区欢乐谷北路8号。<br>Q2:现在适合去旅游吗<br>A2:旅游的适宜性取决于多个因素,包括目的地的疫情状况、旅行限制和个人的健康状况。由于我无法获取实时信息,建议你参考当地政府和卫生部门的指导,以了解目的地的旅行建议和限制。<br>Q3:南京欢乐谷和北京欢乐谷哪个好玩<br>A3:南京欢乐谷和北京欢乐谷都是知名的主题公园,各自都有其独特的魅力和特色。以下是一些比较它们的方面:<br>1. 规模和设施:北京欢乐谷是中国最大的主题公园之一,拥有广阔的面积和丰富多样的游乐设施。南京欢乐谷也是一座大型主题公园,虽然规模较小,但同样提供了多种娱乐项目和设施。<br>2. 地理位置:北京欢乐谷位于中国首都北京,周边有许多其他旅游景点和文化遗址,可以更方便地探索城市的其他景点。南京欢乐谷则位于江苏省南京市,周边也有一些历史和文化景点。<br>3. 主题和氛围:北京欢乐谷以欢乐、刺激和冒险为主题,有许多惊险刺激的游乐设施。南京欢乐谷则更注重家庭娱乐和亲子活动,提供了更多适合全家人一起玩乐的项目。<br>根据以上已知条件和问答内容,理解以下问题意图,并将问题以完整的形式输出<br>Q4:详细解释下第三点 | 详细解释下南京欢乐谷和北京欢乐谷比较中,主题和氛围的部分。 |
+ | **文本切分📋** | 脉冲电子围栏报警系统中文LCD控制键盘使用手册V1.0<br>第一章:脉冲电子围栏入侵报警系统简介<br>尊敬的客户:<br>您好!感谢您使用本公司产品,为了更好更快的安装及使用本产品,请在使用前认真仔细地阅读本手册。<br>脉冲电子围栏系统包括脉冲电子围栏主机以及对其控制的PC主机、中文LCD液晶键盘,本手册针对脉冲电子围栏中文LCD控制键盘适用,如是您有任问技术问题或需要技术支持,请联系我公司,我公司将竭力为您服务。<br>一、脉冲电子围栏主机概述<br>1.1绝对安全,根据GB/T7946-2008要求研发制造,并通过了公安部的形式检验。<br>1.2误报率低和适应性强<br>智能型脉冲电子围栏系统基本不受环境(如树木、小动物、震动等)和气候(如风、雪、雨、雾等)的<br>影响,不受地形高低和曲折程度的限制,误报率极低。<br>1.3阻挡和报警双重功能<br>智能型脉冲电子围栏系统的新概念是把企图入侵者阻挡在防区之外,不作案为目的。<br>能够实实在在给入<br>侵者一种威慑感和阻挡作用,使其不敢轻举妄动,达到防范为主,减少作案次数。<br>1.4连续工作、布防/撤防,按需设定。<br>1.6可根据用户要求和现场地理环境以及安全等级进行设计和安装。<br>并可和多种现代安防产品,例如电视监控系统、安防报警系统配套使用,以提高系统的安全防范等级。<br>1.7绝对安全及报警感知性<br>传统的高压脉冲电网警戒系统没有报警感知功能,仅仅以高压、大电流的方式阻止入侵者,极易造成入<br>侵者伤残,甚至死亡等严重后果。<br>智能型脉冲电子围栏系统采用了低能量的脉冲高压(5\~10KV)。<br>由于能量<br>极低且作用时间极为短暂,因而对人体不会造成伤害。<br>一旦触及,也会因直接有触电感而离开。<br>二、中文LCD控制键盘特点及性能参数<br>功能特点:<br>1.可接128台脉冲电子围栏,中文液晶显示,两路RS485总线通讯接口,方便现场安装施工;<br>2.采用中文液晶显示,显示直观,操作方便<br>3.可同时远程控制128台高压脉冲围栏控制器<br>4.可以实时显示和控制各围栏控制器的状态(脉冲电压幅值、布防/撤防状态)<br>5.报警时显示对应防区的报警类型(防拆、短路、断线、短接),同时有声音提示<br>6.一键布/撤防功能<br>7.可以查询报警历史记录.<br>8.可以实时显示线上电压<br>9.可查询操作记录防止管理人员对系统乱撤防等;<br>10.可控制前端继电器模块输出信号;<br>11.支持遥控器高,低压布防,撤防,复位等;<br>12.六个LED指示灯显示系��工作状态;<br>13.自带一路12V800MA电压报警输出及一路常开常闭信号可选输出;<br>14.可存储100条报警记录,及100条操作记录;<br>技术参数:<br>尺寸(长x宽x厚):19.5x14x2.9cm<br>重量:250克<br>工作环境:-20℃ +50℃;-0-85%湿度<br>工作电压:直流:12伏\~16伏<br>工作电流(直流):静态50毫安;报警100毫安<br>中文液晶显示,显示控制设备的各类信息,包括报警、状态等。<br>第二章:中文LCD控制键盘说明<br>一.中文LCD控制键盘面板示意图:<br>(中文LCD控制键盘图)<br>图片占位符<br>1.正常有电状态时,电源指示灯亮<br>2.系统运行时,运行指示灯亮<br>3.键盘布防时,布防指示灯亮<br>4.系统有报警时,报警指示灯亮<br>5.有无线遥控器的控制信号时,信号指示灯亮<br>二.接线端口<br>1.RS485通讯口2:键盘第二二路485 通讯接口;<br>2.RS485通讯口1:键盘第一路485通讯接口;<br>3. 12V, GND:为键盘12V供电接入口;<br>4.开关量:键盘报警开关量输出接口(常开,常闭可选,在键盘内部继电器旁的JP跳针);<br>5.警号输出接口:"+"接警号正极,"一"接警号负极;<br>(接线端口示意图)<br>图片占位符<br>第三章:编程设置<br>注:系统初始密码为:8888;安装调试完成后,请第一时间修改系统密码!<br>一.系统菜单项及编程设置<br>1.1系统上电初始化界面,显示公司名称及欢迎界面:<br>图片占位符<br>(欢迎使用界面)<br>1.2 
报警信息显示界面及防区状态循环界面:<br>(防区状态循环界面)<br>图片占位符<br>图片占位符<br>(报警信息显示界面)<br>在此两界面下,按"↑""↓"键可来回切换;在报警界面下,Alarm:后面的数字表示当前的防区报警数量;All:后面的数字表示系统总共防区数量。<br>1.3系统功能参数设置:<br>按下键盘上的"菜单"键后,可调出进入至"设置系统参数"主界面;如下图:<br>图片占位符<br>此时光标条产生背景对比度,以示当时选定的菜单项;此时按下"确定"键后,提示输入密码:输入完密码后即可进入到"设置系统参数"的二级菜单页;如下图:<br>图片占位符<br>(输入密码界面,密码为4位,输入正确后自动进入二级菜单)<br>图片占位符<br>(设置系统参数二级菜单界面)<br>1.4防区设置(增加/删除防区)<br>在"设置系统参数"菜单下,通过按"↓"键,选中"防区设置"后,按"确定"键进入菜单;如下图:<br>图片占位符<br>(防区设置界面)<br>态;<br>1.4.1增加防区<br>***,按"确定"键后即可增加相应编号的防区,反复操作即可增加更多的防区;如下图:<br>图片占位符<br>(增加防区界面)<br>1.4.2删除防区<br>在"防区设置界面"通过"↑""↓"键选中预删除的防区号,按一下键盘上的"删除"键后,弹出删除提示菜单后,按键盘上的"确定"键后即可删除当前防区;如下图:<br>图片占位符<br>(删除防区界面)<br>1.5快速布撤防操作<br>在"设置系统参数"菜单下,通过按"↓"键,选择"快速布撤防操作"后,按下"确定"键后进入至"快速布撤防操作"菜单,此时再通过"↑""↓"键选中预对围栏系统进行的操作后按下"确定"键即可;如下图:<br>图片占位符<br>(快速布撤防界面)<br>1.6单防区操作<br>在"设置系统参数"菜单下,通过"↑""↓"键选择"单防区操作"后,按下"确定"键后进入至"单防区操作"菜单,如下图:<br>图片占位符<br>(单防区操作界面)<br>在"单防区操作"界面,通过"↑""↓"键定位光标,输入预单防区操作的防区号:10(假设值),然后按"↓"键将光标下移到电压设置行:(按"2"为高压,"1"为低压);再按"↓"键将光标下移到设置状态行:(按"0"为撤防,"1"为布防),再按"确定"键即可对前端对应防区号的围栏主机进行相应的操作。<br>1.7定时布撤防设置<br>在"设置系统参数"菜单下,通过""键选择"定时布撤防设置"后,按下"确定"键后进入至"定时布撤防设置"菜单,如下图:<br>图片占位符<br>(定时布撤防设置界面)<br>通过"↑""↓"键可移动光标,输入预计的时间段;移至时间段最未端时,通过按下"0/1/2/3"键设置该时间段要进行的定时操作("0"=不操作,"1"=高压布防,"2"=低压布防,"3"=撤防);<br>1.8触发时间设置<br>在"设置系统参数"菜单下,通过"↑""↓"键选择"触发时间设置"后,按下"确定"键后进入至"触发时间设置"菜单,如下图:<br>图片占位符<br>(触发时间设置界面)<br>输入需设置围栏主机报警触发的时间参数(以秒为单位,最大3位数)后按下"确定"键即可,按"取消"键可退格时间参数重新输入时间。<br>1.9报警时间设置<br>在"设置系统参数"菜单下,通过"键选择"报警时间设置"后,按下"确定"键后进入至"报警时间设置"菜单,如下图:<br>图片占位符<br>(报警时间设置界面)<br>输入需设置围栏主机及中文LCD控制键盘报警的时间参数(以���为单位,最大3位数)后按下"确定"键即可,按"取消"键可退格时间参数重新输入时间。<br>报警时间参数即为前端每台围栏主机的报警后自动<br>恢复的时间值及中文控制键盘的报警时间。<br>1.10防区号设置<br>在"设置系统参数"菜单下,通过"↑""↓"键选择"防区号设置"后,按下"确定"键后进入至"防区号设置"菜单,如下图:<br>图片占位符<br>(防区号设置界面)<br>通过"↑""↓"键移光标,输入旧防区号及新防区号后,按下"确定"即可将前端围栏主机的旧防区号改成新的防区号(注:假设前端围栏主机的防区号为"1",要改成新的防区号为"2",此时在此界面旧防区号输入:1,新防区号输入:2,确定完后,原先防区号为"1"的围栏主机就变成了防区号为"2")。<br>1.11键盘模式设置<br>在"设置系统参数"菜单下,通过"↑键选择"键盘模式设置"后,按下"确定"键后进入至"键盘模式设置"菜单,如下图:<br>图片占位符<br>(键盘模式设置界面)<br>通过"↑""↓"键移光标,输入键盘的编号:后按下"确定"键光标移动至键盘模式行,按下"0"表示将此键盘设置为从键盘模式,按下"1"表示将此键盘设置为主键盘模式(注:"0"=从键盘,"1"=主键盘,从键盘只能显示防区状态及防区报警信息,不能对整个系统进行布防,撤防等操作);<br>1.12时间设置<br>在"设置系统参数"菜单下,通过按"↑""↓"键选择"时间设置"后,按下"确定"键后进入至"时间设置"菜单,如下图:<br>图片占位符<br>(时间设置界面)<br>通过按"↑""↓"键移动光标,输入相应的时间年,月,日,小时,分钟后,按下"确定"键,设置时间完毕。<br>1.13密码设置<br>在"设置系统参数"菜单下,通过按"↑""↓"键选择"密码设置"后,按下"确定"键后进入至"密码设置"菜单,如下图:<br>图片占位符<br>(密码设置界面)<br>输入新的4位密码:\*\*\*\*,,输错密码值时,可按"取消"键退格删除数字以重新输入新的密码,再按"确定"键完成密码的修改;<br>1.14恢复出厂时设置<br>在"设置系统参数"菜单下,通过按"↑""↓"键选择"恢复出厂时设置"后,按下"确定"键后进入至"恢复出厂时设置"菜单,如下图:<br>图片占位符<br>(恢复出厂时设置界面)<br>注:按下"确定"键即可将键盘的所有参数恢复至出厂默认参数;请在厂家的指导下谨慎操作!<br>1.15删除报警记录<br>在主菜单下,通过按"↑""↓"键选择"删除报警记录"后,按下"确定"键后提示输入密码:\*\*\*\* ,输入正确密码后,进入至"确定删除所有记录?"界面,按下"确定"键后,删除成功同时提示"无更多记录";如下图:<br>图片占位符<br>1.16删除操作记录<br>(删除记录确定界面)<br>在主菜单下,通过按"↑""↓"键选择"删除操作记录"后,按下"确定"键后提示输入密码:\*\*\*\*,输入正确密码后,进入至"确定删除所有记录?"界面,按下"确定"键后,删除成功同时提示"无更多记录";如下图:<br>图片占位符<br>(删除记录确定界面)<br>第四章:系统日常操作<br> 
注:系统初始密码为:8888;安装调试完成后,请第一时间修改系统密码!<br>一.快速高低压布防<br>在系统"防区状态循环界面"或者"报警信息显示界面"下,如果系统当前菜单页不在此两界面下时,可通过按"菜单"键来切换至"防区状态循环界面"和"报警信息显示界面";然后按"布防"键后,提示输入密码:\*\*\*\*即可进入"快速布防"菜单页;此时通过按"↑""↓"键选中需要进行"快速高压布防"或者"快速低压布防"后,按下"确定"键即可对整个系统进行相应的高压/低压布防操作;如下图:<br>图片占位符<br>二.快速撤防<br>(快速布防界面)<br>在系统"防区状态循环界面"或者"报警信息显示界面"下,如果系统当前菜单页不在此两界面下时,可通过按"菜单"键来切换至"防区状态循环"界面和"报警信息显示"界面;然后按"撤防"键后,提示输入密码:\*\*\*\*即可进入至"快速撤防"菜单页;按下"确定"键即可对整个系统进行相应的撤防操作;如下图:<br>图片占位符<br>三.报警复位<br>(快速撤防界面)<br>当系统前端有围栏主机或者地址模块防区被触发时,键盘自动切换到"报警信息显示"界面,如下图:<br>"报警信息显示"显示了当前的报警防区数量,及报警的触发条件(防拆,短路,断线,短接,模块防区报警);在报警触发时,键盘产生报警输出,同时前端围栏主机输出12V电压信号和开关量信号,此时按下"复位"键后,键盘报警恢复正常,同时前端围栏主机也恢复正常状态;且LCD控制键盘界面显示"当前无报警防区";如下图:<br>图片占位符<br>四:无线遥控器快速操作<br>下图:随金可以过过出厂围置药4继无线境的网时隔统进行"南打用用中限,围际,发位"���作:<br>图片占位符<br>五:报警记录查询<br>按下"菜单"键,让键盘切换到一级主菜下,通过"↑""↓"键选中"报警记录查询"即可进入报警查询菜单,此时显示当前最新一条报警的信息,可通过"↑""↓"键一条一条的查询;如下图:<br>图片占位符 | 脉冲电子围栏报警系统中文LCD控制键盘使用手册V1.0<br><span style="color: #3498db;">`#` </span>第一章:脉冲电子围栏入侵报警系统简介<br><span style="color: #3498db;">`##` </span>尊敬的客户:<br>您好!感谢您使用本公司产品,为了更好更快的安装及使用本产品,请在使用前认真仔细地阅读本手册。<br>脉冲电子围栏系统包括脉冲电子围栏主机以及对其控制的PC主机、中文LCD液晶键盘,本手册针对脉冲电子围栏中文LCD控制键盘适用,如是您有任问技术问题或需要技术支持,请联系我公司,我公司将竭力为您服务。<br><span style="color: #3498db;">`##` </span>一、脉冲电子围栏主机概述<br>1.1绝对安全,根据GB/T7946-2008要求研发制造,并通过了公安部的形式检验。<br>1.2误报率低和适应性强<br>智能型脉冲电子围栏系统基本不受环境(如树木、小动物、震动等)和气候(如风、雪、雨、雾等)的<br>影响,不受地形高低和曲折程度的限制,误报率极低。<br>1.3阻挡和报警双重功能<br>智能型脉冲电子围栏系统的新概念是把企图入侵者阻挡在防区之外,不作案为目的。<br>能够实实在在给入<br>侵者一种威慑感和阻挡作用,使其不敢轻举妄动,达到防范为主,减少作案次数。<br>1.4连续工作、布防/撤防,按需设定。<br>1.6可根据用户要求和现场地理环境以及安全等级进行设计和安装。<br>并可和多种现代安防产品,例如电视监控系统、安防报警系统配套使用,以提高系统的安全防范等级。<br>1.7绝对安全及报警感知性<br>传统的高压脉冲电网警戒系统没有报警感知功能,仅仅以高压、大电流的方式阻止入侵者,极易造成入<br>侵者伤残,甚至死亡等严重后果。<br>智能型脉冲电子围栏系统采用了低能量的脉冲高压(5\~10KV)。<br>由于能量<br>极低且作用时间极为短暂,因而对人体不会造成伤害。<br>一旦触及,也会因直接有触电感而离开。<br><span style="color: #3498db;">`##` </span>二、中文LCD控制键盘特点及性能参数<br><span style="color: #3498db;">`###` </span>功能特点:<br>1.可接128台脉冲电子围栏,中文液晶显示,两路RS485总线通讯接口,方便现场安装施工;<br>2.采用中文液晶显示,显示直观,操作方便<br>3.可同时远程控制128台高压脉冲围栏控制器<br>4.可以实时显示和控制各围栏控制器的状态(脉冲电压幅值、布防/撤防状态)<br>5.报警时显示对应防区的报警类型(防拆、短路、断线、短接),同时有声音提示<br>6.一键布/撤防功能<br>7.可以查询报警历史记录.<br>8.可以实时显示线上电压<br>9.可查询操作记录防止管理人员对系统乱撤防等;<br>10.可控制前端继电器模块输出信号;<br>11.支持遥控器高,低压布防,撤防,复位等;<br>12.六个LED指示灯显示系统工作状态;<br>13.自带一路12V800MA电压报警输出及一路常开常闭信号可选输出;<br>14.可存储100条报警记录,及100条操作记录;<br><span style="color: #3498db;">`###` </span>技术参数:<br>尺寸(长x宽x厚):19.5x14x2.9cm<br>重量:250克<br>工作环境:-20℃ +50℃;-0-85%湿度<br>工作电压:直流:12伏\~16伏<br>工作电流(直流):静态50毫安;报警100毫安<br>中文液晶显示,显示控制设备的各类信息,包括报警、状态等。<br><span style="color: #3498db;">`#` </span>第二章:中文LCD控制键盘说明<br><span style="color: #3498db;">`##` </span>一.中文LCD控制键盘面板示意图:<br>(中文LCD控制键盘图)<br>图片占位符<br>1.正常有电状态时,电源指示灯亮<br>2.系统运行时,运行指示灯亮<br>3.键盘布防时,布防指示灯亮<br>4.系统有报警时,报警指示灯亮<br>5.有无线遥控器的控制信号时,信号指示灯亮<br><span style="color: #3498db;">`##` </span>二.接线端口<br>1.RS485通讯口2:键盘第二二路485 通讯接口;<br>2.RS485通讯口1:键盘第一路485通讯接口;<br>3. 
12V, GND:为键盘12V供电接入口;<br>4.开关量:键盘报警开关量输出接口(常开,常闭可选,在键盘内部继电器旁的JP跳针);<br>5.警号输出接口:"+"接警号正极,"一"接警号负极;<br>(接线端口示意图)<br>图片占位符<br><span style="color: #3498db;">`#` </span>第三章:编程设置<br>注:系统初始密码为:8888;安装调试完成后,请第一时间修改系统密码!<br><span style="color: #3498db;">`##` </span>一.系统菜单项及编程设置<br><span style="color: #3498db;">`###` </span>1.1系统上电初始化界面,显示公司名称及欢迎界面:<br>图片占位符<br>(欢迎使用界面)<br><span style="color: #3498db;">`###` </span>1.2 报警信息显示界面及防区状态循环界面:<br>(防区状态循环界面)<br>图片占位符<br>图片占位符<br>(报警信息显示界面)<br>在此两界面下,按"↑""↓"键可来回切换;在报警界面下,Alarm:后面的数字表示当前的防区报警数量;All:后面的数字表示系统总共防区数量。<br><span style="color: #3498db;">`###` </span>1.3系统功能参数设置:<br>按下键盘上的"菜单"键后,可调出进入至"设置系统参数"主界面;如下图:<br>图片占位符<br>此时光标条产生背景对比度,以示当时选定的菜单项;此时按下"确定"键后,提示输入密码:输入完密码后即可进入到"设置系统参数"的二级菜单页;如下图:<br>图片占位符<br>(输入密码界面,密码为4位,输入正确后自动进入二级菜单)<br>图片占位符<br>(设置系统参数二级菜单界面)<br><span style="color: #3498db;">`###` </span>1.4防区设置(增加/删除防区)<br>在"设置系统参数"菜单下,通过按"↓"键,选中"防区设置"后,按"确定"键进入菜单;如下图:<br>图片占位符<br>(防区设置界面)<br>态;<br><span style="color: #3498db;">`####` </span>1.4.1增加防区<br>***,按"确定"键后即可增加相应编号的防区,反复操作即可增加更多的防区;如下图:<br>图片占位符<br>(增加防区界面)<br><span style="color: #3498db;">`####` </span>1.4.2删除防区<br>在"防区设置界面"通过"↑""↓"键选中预删除的防区号,按一下键盘上的"删除"键后,弹出删除提示菜单后,按键盘上的"确定"键后即可删除当前防区;如下图:<br>图片占位符<br>(删除防区界面)<br><span style="color: #3498db;">`###` </span>1.5快速布撤防操作<br>在"设置系统参数"菜单下,通过按"↓"键,选择"快速布撤防操作"后,按下"确定"键后进入至"快速布撤防操作"菜单,此时再通过"↑""↓"键选中预对围栏系统进行的操作后按下"确定"键即可;如下图:<br>图片占位符<br>(快速布撤防界面)<br><span style="color: #3498db;">`###` </span>1.6单防区操作<br>在"设置系统参数"菜单下,通过"↑""↓"键选择"单防区操作"后,按下"确定"键后进入至"单防区操作"菜单,如下图:<br>图片占位符<br>(单防区操作界面)<br>在"单防区操作"界面,通过"↑""↓"键定位光标,输入预单防区操作的防区号:10(假设值),然后按"↓"键将光标下移到电压设置行:(按"2"为高压,"1"为低压);再按"↓"键将光标下移到设置状态行:(按"0"为撤防,"1"为布防),再按"确定"键即可对前端对应防区号的围栏主机进行相应的操作。<br><span style="color: #3498db;">`###` </span>1.7定时布撤防设置<br>在"设置系统参数"菜单下,通过""键选择"定时布撤防设置"后,按下"确定"键后进入至"定时布撤防设置"菜单,如下图:<br>图片占位符<br>(定时布撤防设置界面)<br>通过"↑""↓"键可移动光标,输入预计的时间段;移至时间段最未端时,通过按下"0/1/2/3"键设置该时间段要进行的定时操作("0"=不操作,"1"=高压布防,"2"=低压布防,"3"=撤防);<br><span style="color: #3498db;">`###` </span>1.8触发时间设置<br>在"设置系统参数"菜单下,通过"↑""↓"键选择"触发时间设置"后,按下"确定"键后进入至"触发时间设置"菜单,如下图:<br>图片占位符<br>(触发时间设置界面)<br>输入需设置围栏主机报警触发的时间参数(以秒为单位,最大3位数)后按下"确定"键即可,按"取消"键可退格时间参数重新输入时间。<br><span style="color: #3498db;">`###` </span>1.9报警时间设置<br>在"设置系统参数"菜单下,通过"键选择"报警时间设置"后,按下"确定"键后进入至"报警时间设置"菜单,如下图:<br>图片占位符<br>(报警时间设置界面)<br>输入需设置围栏主机及中文LCD控制键盘报警的时间参数(以秒为单位,最大3位数)后按下"确定"键即可,按"取消"键可退格时间参数重新输入时间。<br>报警时间参数即为前端每台围栏主机的报警后自动<br>恢复的时间值及中文控制键盘的报警时间。<br><span style="color: #3498db;">`###` </span>1.10防区号设置<br>在"设置系统参数"菜单下,通过"↑""↓"键选择"防区号设置"后,按下"确定"键后进入至"防区号设置"菜单,如下图:<br>图片占位符<br>(防区号设置界面)<br>通过"↑""↓"键移光标,输入旧防区号及新防区号后,按下"确定"即可将前端围栏主机的旧防区号改成新的防区号(注:假设前端围栏主机的防区号为"1",要改成新的防区号为"2",此时在此界面旧防区号输入:1,新防区号输入:2,确定完后,原先防区号为"1"的围栏主机就变成了防区号为"2")。<br><span style="color: #3498db;">`###` </span>1.11键盘模式设置<br>在"设置系统参数"菜单下,通过"↑键选择"键盘模式设置"后,按下"确定"键后进入至"键盘模式设置"菜单,如下图:<br>图片占位符<br>(键盘模式设置界面)<br>通过"↑""↓"键移光标,输入键盘的编号:后按下"确定"键光标移动至键盘模式行,按下"0"表示将此键盘设置为从键盘模式,按下"1"表示将此键盘设置为主键盘模式(注:"0"=从键盘,"1"=主键盘,从键盘只能显示防区状态及防区报警信息,不能对整个系统进行布防,撤防等操作);<br><span style="color: #3498db;">`###` </span>1.12时间设置<br>在"设置系统参数"菜单下,通过按"↑""↓"键选择"时间设置"后,按下"确定"键后进入至"时间设置"菜单,如下图:<br>图片占位符<br>(时间设置界面)<br>通过按"↑""↓"键移动光标,输入相应的时间年,月,日,小时,分钟后,按下"确定"键,设置时间完毕。<br><span style="color: #3498db;">`###` </span>1.13密码设置<br>在"设置系统参数"菜单下,通过按"↑""↓"键选择"密码设置"后,按下"确定"键后进入至"密码设置"菜单,如下图:<br>图片占位符<br><span style="color: #3498db;">`####` </span>(密码设置界面)<br>输入新的4位密码:\*\*\*\*,,输错密码值时,可按"取消"键退格删除数字以重新输入新的密码,再按"确定"键完成密码的修改;<br><span style="color: #3498db;">`###` 
</span>1.14恢复出厂时设置<br>在"设置系统参数"菜单下,通过按"↑""↓"键选择"恢复出厂时设置"后,按下"确定"键后进入至"恢复出厂时设置"菜单,如下图:<br>图片占位符<br>(恢复出厂时设置界面)<br>注:按下"确定"键即可将键盘的所有参数恢复至出厂默认参数;请在厂家的指导下谨慎操作!<br><span style="color: #3498db;">`###` </span>1.15删除报警记录<br>在主菜单下,通过按"↑""↓"键选择"删除报警记录"后,按下"确定"键后提示输入密码:\*\*\*\* ,输入正确密码后,进入至"确定删除所有记录?"界面,按下"确定"键后,删除成功同时提示"无更多记录";如下图:<br>图片占位符<br><span style="color: #3498db;">`###` </span>1.16删除操作记录<br>(删除记录确定界面)<br>在主菜单下,通过按"↑""↓"键选择"删除操作记录"后,按下"确定"键后提示输入密码:\*\*\*\*,输入正确密码后,进入至"确定删除所有记录?"界面,按下"确定"键后,删除成功同时提示"无更多记录";如下图:<br>图片占位符<br>(删除记录确定界面)<br><span style="color: #3498db;">`#` </span>第四章:系统日常操作<br>注:系统初始密码为:8888;安装调试完成后,请第一时间修改系统密码!<br><span style="color: #3498db;">`##` </span>一.快速高低压布防<br>在系统"防区状态循环界面"或者"报警信息显示界面"下,如果系统当前菜单页不在此两界面下时,可通过按"菜单"键来切换至"防区状态循环界面"和"报警信息显示界面";然后按"布防"键后,提示输入密码:\*\*\*\*即可进入"快速布防"菜单页;此时通过按"↑""↓"键选中需要进行"快速高压布防"或者"快速低压布防"后,按下"确定"键即可对整个系统进行相应的高压/低压布防操作;如下图:<br>图片占位符<br><span style="color: #3498db;">`##` </span>二.快速撤防<br>(快速布防界面)<br>在系统"防区状态循环界面"或者"报警信息显示界面"下,如果系统当前菜单页不在此两界面下时,可通过按"菜单"键来切换至"防区状态循环"界面和"报警信息显示"界面;然后按"撤防"键后,提示输入密码:\*\*\*\*即可进入至"快速撤防"菜单页;按下"确定"键即可对整个系统进行相应的撤防操作;如下图:<br>图片占位符<br><span style="color: #3498db;">`##` </span>三.报警复位<br>(快速撤防界面)<br>当系统前端有围栏主机或者地址模块防区被触发时,键盘自动切换到"报警信息显示"界面,如下图:<br>"报警信息显示"显示了当前的报警防区数量,及报警的触发条件(防拆,短路,断线,短接,模块防区报警);在报警触发时,键盘产生报警输出,同时前端围栏主机输出12V电压信号和开关量信号,此时按下"复位"键后,键盘报警恢复正常,同时前端围栏主机也恢复正常状态;且LCD控制键盘界面显示"当前无报警防区";如下图:<br>图片占位符<br><span style="color: #3498db;">`##` </span>四:无线遥控器快速操作<br>下图:随金可以过过出厂围置药4继无线境的网时隔统进行"南打用用中限,围际,发位"操作:<br>图片占位符<br><span style="color: #3498db;">`##` </span>五:报警记录查询<br>按下"菜单"键,让键盘切换到一级主菜下,通过"↑""↓"键选中"报警记录查询"即可进入报警查询菜单,此时显示当前最新一条报警的信息,可通过"↑""↓"键一条一条的查询;如下图:<br>图片占位符 |
+ | **Question Rewriting✍️** | Q1: What do the five mountains in China mean?<br>A1: China's Five Mountains refer to five famous peaks located in China, and they are:...<br>Q2: Among them, in which year Huashan was rated as an AAAAAA scenic spot...<br>A2:2011<br>根据以上已知条件和问答内容,理解以下问题意图,并将问题以完整的形式输出:<br>Q3:What about Mount Tai? | In which year was Mount Taishan rated as an AAAAA scenic spot. |
+ | **Text Segmentation📋** | LT-02A Infrared Thermometer Manual<br>1 Introduction<br>Thank you for choosing the LT-02A series temperature sensor.<br>The infrared temperature sensor can calculate the surface temperature of an object by measuring the infrared radiation emitted by the target without contact.<br>Non-contact temperature measurement is the biggest advantage of infrared thermometers, allowing users to easily measure targets that are difficult to access or are moving.<br>The LT-02A series temperature sensor is an integrated infrared temperature sensor where the sensor, optical system, and electronic circuitry are all housed within a stainless steel casing. The LT-02A series is easy to install, with standard threads on the metal casing for quick connection to mounting points. Additionally, the LT-02A series offers various options (such as air purgers, mounting brackets, adjustable mounting brackets, air purge protection sleeves, etc.) to meet the requirements of various working conditions.<br>2 Parameter Description<br>a. Basic Performance<br>Protection rating IP65 (NEMA-4)<br>Ambient temperature 0\~60°C<br>Storage temperature -20\~80°C<br>Relative humidity 10-95% (non-condensing)<br>Material Stainless steel<br>Cable length 1.5m (standard), other special specifications (customizable)<br>b. Electrical Parameters<br>Operating power supply 24 VDC<br>Maximum current 50mA<br>Output signal 4\~20mA or 0-5V linear<br>c. Measurement Parameters<br>Spectral range 8\~14μm<br>Temperature range 0\~200°C<br>Optical resolution 20:1<br>Response time 50 ms (95%)<br>Temperature measurement accuracy ±0.5% of reading or ±0.5°C, whichever is greater<br>Repeat accuracy ±0.5% of reading or ±0.5°C, whichever is greater Dimensions 113mm x φ18mm (length * diameter)<br>Emissivity 0.95 fixed<br>d. Optical Path Diagram<br>Image placeholder<br>3 Working Principle and Precautions<br>a. Infrared Temperature Measurement Principle<br>All objects emit infrared energy, and the radiation intensity varies with temperature.<br>Infrared thermometers generally use infrared radiation energy within the wavelength range of 0.8μm to 18μm.<br>An infrared temperature sensor is a photoelectric sensor that receives infrared radiation and converts it into an electrical signal, which is then processed through electronic circuit amplification, linearization, and signal processing to display or output temperature.<br>b. Maximum Distance and Size of the Measured Point.<br>The size of the target and the optical characteristics of the infrared thermometer determine the maximum distance between the target and the measurement head.<br>To avoid measurement errors, the target should ideally fill the field of view of the detector.<br>Therefore, the measured point should always be smaller than the object or at least the same size as the target.<br>C.<br>Ambient Temperature<br>The LT-02A series infrared temperature sensor can operate within an ambient temperature range of 0-60°C.<br>Otherwise, please select a cooling protection sleeve.<br>d. Lens Cleaning<br>The instrument's lens must be kept clean to avoid measurement errors or even lens damage caused by contaminants such as dust and smoke. If dust adheres to the lens, it can be wiped clean with lens paper dipped in anhydrous alcohol.<br>e. 
Electromagnetic Interference<br>To prevent electromagnetic interference, please ensure the following measures:<br>During installation, keep the infrared temperature sensor as far away as possible from sources of electromagnetic fields (such as electric motors, engines, high-power cables, etc.). If necessary, use a metal conduit.<br>4 Installation<br>a Mechanical Installation<br>The LT-02A series metal housing features an M18x1 thread, allowing for direct installation or installation via a mounting bracket. An adjustable mounting bracket facilitates easier adjustment of the measurement head.<br>When aligning the target with the measurement head, ensure the optical path is unobstructed.<br>b Electrical Installation Wiring<br>Table placeholder<br>For 4\~20mA analog signal output.<br>It uses a two-wire loop current output method. The connection to a display or controller has the following two typical applications (connection methods):<br>Display/controller internally provides 24V power supply<br>Image placeholder<br>5 Dimensions and Options<br>a. Dimensions<br>Image placeholder<br>Figure 5-1a Dimensions<br>Image placeholder<br>Figure 5-1b Dimensions<br>Image placeholder<br>Cooling Jacket Dimensions<br>Image placeholder<br>Air Purge Cooling Jacket<br>6 Packing List<br>Standard Accessories:<br>LT-02A series temperature sensor (with 1.5-meter cable), fixing nut, user manual.<br>Please check the product packaging for any damage. Immediately notify your local agent if any damage is found, and retain the damaged packaging for inspection.<br>You can find the product serial number on the product label.<br>Please provide the serial number when contacting customer service for maintenance, ordering parts, or repairs.<br>7 Maintenance<br>If you encounter any issues while using the LT-02A series temperature sensor, please contact our service department.<br>Our customer service team will provide technical support regarding temperature sensor setup, calibration procedures, and maintenance.<br>Experience shows that these issues can usually be resolved over the phone. Please contact our customer service before deciding to return the instrument.<br>8 Warranty<br>Each instrument undergoes quality inspection procedures. If any issues occur, contact your service provider immediately.<br>The instrument has a 12-month warranty from the date of shipment. After expiration, the manufacturer provides an additional 6-month warranty for repairs or component replacement.<br>Damage caused by unauthorized disassembly or improper use is not covered by the warranty.<br>During the warranty period, faulty instruments will be replaced, calibrated, or repaired free of charge, with shipping costs borne by the sender.<br>The manufacturer reserves the right to repair the instrument or replace components.<br>If the malfunction is due to user misuse, the user must bear the repair costs and may inquire about charges in advance. 
| LT-02A Infrared Thermometer Manual<br><span style="color: #3498db;">`#` </span>1 Introduction<br>Thank you for choosing the LT-02A series temperature sensor.<br>The infrared temperature sensor can calculate the surface temperature of an object by measuring the infrared radiation emitted by the target without contact.<br>Non-contact temperature measurement is the biggest advantage of infrared thermometers, allowing users to easily measure targets that are difficult to access or are moving.<br>The LT-02A series temperature sensor is an integrated infrared temperature sensor where the sensor, optical system, and electronic circuitry are all housed within a stainless steel casing.<br>The LT-02A series is easy to install, with standard threads on the metal casing for quick connection to mounting points.<br>Additionally, the LT-02A series offers various options (such as air purgers, mounting brackets, adjustable mounting brackets, air purge protection sleeves, etc.)<br>to meet the requirements of various working conditions.<br><span style="color: #3498db;">`#` </span>2 Parameter Description<br><span style="color: #3498db;">`##` </span>a. Basic Performance<br>Protection rating IP65 (NEMA-4)<br>Ambient temperature 0\~60°C<br>Storage temperature -20\~80°C<br>Relative humidity 10-95% (non-condensing)<br>Material Stainless steel<br>Cable length 1.5m (standard), other special specifications (customizable)<br><span style="color: #3498db;">`##` </span>b. Electrical Parameters<br>Operating power supply 24 VDC<br>Maximum current 50mA<br>Output signal 4\~20mA or 0-5V linear<br><span style="color: #3498db;">`##` </span>c. Measurement Parameters<br>Spectral range 8\~14μm<br>Temperature range 0\~200°C<br>Optical resolution 20:1<br>Response time 50 ms (95%)<br>Temperature measurement accuracy ±0.5% of reading or ±0.5°C, whichever is greater<br>Repeat accuracy ±0.5% of reading or ±0.5°C, whichever is greater Dimensions 113mm x φ18mm (length * diameter)<br>Emissivity 0.95 fixed<br><span style="color: #3498db;">`##` </span>d. Optical Path Diagram<br>Image placeholder<br><span style="color: #3498db;">`#` </span>3 Working Principle and Precautions<br><span style="color: #3498db;">`##` </span>a. Infrared Temperature Measurement Principle<br>All objects emit infrared energy, and the radiation intensity varies with temperature.<br>Infrared thermometers generally use infrared radiation energy within the wavelength range of 0.8μm to 18μm.<br>An infrared temperature sensor is a photoelectric sensor that receives infrared radiation and converts it into an electrical signal, which is then processed through electronic circuit amplification, linearization, and signal processing to display or output temperature.<br><span style="color: #3498db;">`##` </span>b. Maximum Distance and Size of the Measured Point.<br>The size of the target and the optical characteristics of the infrared thermometer determine the maximum distance between the target and the measurement head.<br>To avoid measurement errors, the target should ideally fill the field of view of the detector.<br>Therefore, the measured point should always be smaller than the object or at least the same size as the target.<br><span style="color: #3498db;">`##` </span>C.<br><span style="color: #3498db;">`##` </span>Ambient Temperature<br>The LT-02A series infrared temperature sensor can operate within an ambient temperature range of 0-60°C.<br>Otherwise, please select a cooling protection sleeve.<br><span style="color: #3498db;">`##` </span>d. 
Lens Cleaning<br>The instrument's lens must be kept clean to avoid measurement errors or even lens damage caused by contaminants such as dust and smoke.<br>If dust adheres to the lens, it can be wiped clean with lens paper dipped in anhydrous alcohol.<br><span style="color: #3498db;">`##` </span>e. Electromagnetic Interference<br>To prevent electromagnetic interference, please ensure the following measures:<br>During installation, keep the infrared temperature sensor as far away as possible from sources of electromagnetic fields (such as electric motors, engines, high-power cables, etc.).<br>If necessary, use a metal conduit.<br><span style="color: #3498db;">`#` </span>4 Installation<br><span style="color: #3498db;">`##` </span>a Mechanical Installation<br>The LT-02A series metal housing features an M18x1 thread, allowing for direct installation or installation via a mounting bracket.<br>An adjustable mounting bracket facilitates easier adjustment of the measurement head.<br>When aligning the target with the measurement head, ensure the optical path is unobstructed.<br><span style="color: #3498db;">`##` </span>b Electrical Installation Wiring<br>Table placeholder<br>For 4\~20mA analog signal output.<br>It uses a two-wire loop current output method.<br>The connection to a display or controller has the following two typical applications (connection methods):<br>Display/controller internally provides 24V power supply<br>Image placeholder<br><span style="color: #3498db;">`#` </span>5 Dimensions and Options<br><span style="color: #3498db;">`##` </span>a. Dimensions<br>Image placeholder<br>Figure 5-1a Dimensions<br>Image placeholder<br>Figure 5-1b Dimensions<br>Image placeholder<br>Cooling Jacket Dimensions<br>Image placeholder<br>Air Purge Cooling Jacket<br><span style="color: #3498db;">`#` </span>6 Packing List<br>Standard Accessories:<br>LT-02A series temperature sensor (with 1.5-meter cable), fixing nut, user manual.<br>Please check the product packaging for any damage.<br>Immediately notify your local agent if any damage is found, and retain the damaged packaging for inspection.<br>You can find the product serial number on the product label.<br>Please provide the serial number when contacting customer service for maintenance, ordering parts, or repairs.<br><span style="color: #3498db;">`#` </span>7 Maintenance<br>If you encounter any issues while using the LT-02A series temperature sensor, please contact our service department.<br>Our customer service team will provide technical support regarding temperature sensor setup, calibration procedures, and maintenance.<br>Experience shows that these issues can usually be resolved over the phone.<br>Please contact our customer service before deciding to return the instrument.<br><span style="color: #3498db;">`#` </span>8 Warranty<br>Each instrument undergoes quality inspection procedures.<br>If any issues occur, contact your service provider immediately.<br>The instrument has a 12-month warranty from the date of shipment.<br>After expiration, the manufacturer provides an additional 6-month warranty for repairs or component replacement.<br>Damage caused by unauthorized disassembly or improper use is not covered by the warranty.<br>During the warranty period, faulty instruments will be replaced, calibrated, or repaired free of charge, with shipping costs borne by the sender.<br>The manufacturer reserves the right to repair the instrument or replace components.<br>If the malfunction is due to user misuse, the user must bear the repair costs and may 
inquire about charges in advance.<br> |
237
+
238
+ > **Note**: For specialized tasks, in-domain post-training is further applied.
assets/general_agentic_instruct.png ADDED

Git LFS Details

  • SHA256: 93416b35f45fb33972740564cdf38b5c0ec74e6e305de47843bee152b6677357
  • Pointer size: 131 Bytes
  • Size of remote file: 572 kB
assets/youtu-llm-logo.png ADDED

Git LFS Details

  • SHA256: 83625a8be39c17aca9cd9185f2984ce545a88b3eeb475afb9c25afeea87e10b8
  • Pointer size: 131 Bytes
  • Size of remote file: 299 kB
chat_template.jinja ADDED
@@ -0,0 +1 @@
1
+ {% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% set ns = namespace(is_first=false, is_tool=false, is_tool_message=false, first_tool_index=messages|length, is_output_first=true, system_prompt='', is_first_sp=true, is_last_user=false) %}{% for message in messages %}{% if message['role'] == 'system' %}{% if ns.is_first_sp %}{% set ns.system_prompt = ns.system_prompt + message['content'] %}{% set ns.is_first_sp = false %}{% else %}{% set ns.system_prompt = ns.system_prompt + '\n\n' + message['content'] %}{% endif %}{% endif %}{% if not ns.is_tool_message and (message['role'] == 'tool' or (message['role'] == 'user' and message['content'].startswith('<tool_response>') and message['content'].endswith('</tool_response>'))) %}{% set ns.is_tool_message = true %}{% set ns.first_tool_index = loop.index0 %}{% endif %}{% endfor %}{% if tools is defined and tools is not none %}{% set tool_ns = namespace(text='<|begin_of_tool_description|>Tool calling capabilities.\nYou may call one or more functions to assist with the user query. You have the following functions available:', return_text='For tool call returns, you MUST use the following format:\n<tool_call>{\"name\": \"function-name\", \"arguments\": {\"param1\": \"value1\", \"param2\": \"value2\"}}</tool_call>\n<|end_of_tool_description|>') %}{% for tool in tools %}{% set tool_ns.text = tool_ns.text + '\n```json\n' + (tool | tojson) + '\n```' %}{% endfor %}{% set tool_ns.text = tool_ns.text + '\n' + tool_ns.return_text %}{% if ns.system_prompt == '' %}{% set ns.system_prompt = tool_ns.text %}{% else %}{% set ns.system_prompt = ns.system_prompt + '\n\n' + tool_ns.text %}{% endif %}{% endif %}{{ bos_token }}{{ ns.system_prompt }}{% for message in messages %}{% set content = message['content'] %}{% if message['role'] == 'user' %}{% set ns.is_tool = false %}{% set ns.is_first = false %}{% set ns.is_last_user = true %}{{ '<|User|>' + content }}{% endif %}{% if message['role'] == 'assistant' %}{% if '</think>' in content and not loop.last and loop.index0 < (ns.first_tool_index - 1) %}{% set content = content.rsplit('</think>')[-1].lstrip('\n') %}{% endif %}{% if '<think>' not in content and '</think>' not in content and loop.last %}{% set content = '<think>\n\n</think>\n\n' + content %}{% endif %}{% endif %}{% if message['role'] == 'assistant' and message['tool_calls'] is defined and message['tool_calls'] is not none %}{% set ns.is_last_user = false %}{{ '<|Assistant|>' }}{% if content is not none %}{{ content }}{% endif %}{% set ns.is_first = false %}{% set ns.is_tool = false %}{% set ns.is_output_first = true %}{% for tool in message['tool_calls'] %}{% if tool['function']['arguments'] is string %}{% set tool_call_str = '{\"name\": \"' + tool['function']['name'] + '\", \"arguments\": ' + tool['function']['arguments'] + '}' %}{% else %}{% set tool_call_str = '{\"name\": \"' + tool['function']['name'] + '\", \"arguments\": ' + tool['function']['arguments']|tojson + '}' %}{% endif %}{% if not ns.is_first %}{{ '<tool_call>' + tool_call_str + '</tool_call>' }}{% set ns.is_first = true %}{% else %}{{ '\n' + '<tool_call>' + tool_call_str + '</tool_call>' }}{% endif %}{% endfor %}{{ '<|end_of_text|>' }}{% endif %}{% if message['role'] == 'assistant' and (message['tool_calls'] is not defined or message['tool_calls'] is none)%}{% set ns.is_last_user = false %}{% set ns.is_tool = false %}{% set ns.is_output_first = true %}{{ '<|Assistant|>' + content + '<|end_of_text|>' }}{% endif %}{% if message['role'] == 'tool' 
%}{% set ns.is_last_user = false %}{% set ns.is_tool = true %}{% if ns.is_output_first %}{{ '<|User|><tool_response>' + content + '</tool_response>' }}{% set ns.is_output_first = false %}{% else %}{{ '\n<tool_response>' + content + '</tool_response>' }}{% endif %}{% endif %}{% endfor %}{% if add_generation_prompt and (ns.is_last_user or ns.is_tool) %}{{ '<|Assistant|>' }}{% if enable_thinking is defined and enable_thinking is false %}{{ '<think>\n\n</think>\n\n' }}{% elif forced_thinking is defined and forced_thinking is true %}{{ '<think>\n' }}{% endif %}{% endif %}
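The template above merges system messages, injects tool schemas between the `<|begin_of_tool_description|>` markers, wraps tool invocations in `<tool_call>` tags, and optionally pre-fills an empty `<think>` block. A minimal sketch of exercising it through `transformers` (the repo id comes from the config docstring below; the weather tool is purely hypothetical):

```python
# Sketch: rendering the chat template above via transformers.
# Assumptions: "tencent/Youtu-LLM-2B" is the published repo id, and
# get_weather is an illustrative tool, not part of this repo.
from transformers import AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("tencent/Youtu-LLM-2B", trust_remote_code=True)

messages = [
    {"role": "system", "content": "You are a helpful assistant."},
    {"role": "user", "content": "What is the weather in Paris?"},
]
tools = [{
    "type": "function",
    "function": {
        "name": "get_weather",  # hypothetical tool for illustration
        "description": "Look up the current weather for a city.",
        "parameters": {
            "type": "object",
            "properties": {"city": {"type": "string"}},
            "required": ["city"],
        },
    },
}]

prompt = tokenizer.apply_chat_template(
    messages,
    tools=tools,
    tokenize=False,
    add_generation_prompt=True,  # last turn is a user turn, so '<|Assistant|>' is appended
    enable_thinking=False,       # template then pre-fills '<think>\n\n</think>\n\n'
)
print(prompt)
```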
config.json ADDED
@@ -0,0 +1,39 @@
1
+ {
2
+ "architectures": [
3
+ "YoutuForCausalLM"
4
+ ],
5
+ "attention_bias": false,
6
+ "attention_dropout": 0.0,
7
+ "auto_map": {
8
+ "AutoConfig": "configuration_youtu.YoutuConfig",
9
+ "AutoModel": "modeling_youtu.YoutuModel",
10
+ "AutoModelForCausalLM": "modeling_youtu.YoutuForCausalLM"
11
+ },
12
+ "bos_token_id": 128000,
13
+ "eos_token_id": 128001,
14
+ "hidden_act": "silu",
15
+ "hidden_size": 2048,
16
+ "initializer_range": null,
17
+ "embedding_initializer_range": null,
18
+ "intermediate_size": 6144,
19
+ "kv_lora_rank": 512,
20
+ "max_position_embeddings": 131072,
21
+ "mlp_bias": false,
22
+ "model_type": "youtu_llm",
23
+ "num_attention_heads": 16,
24
+ "num_hidden_layers": 32,
25
+ "num_key_value_heads": 16,
26
+ "q_lora_rank": 1536,
27
+ "qk_nope_head_dim": 128,
28
+ "qk_rope_head_dim": 64,
29
+ "rms_norm_eps": 1e-06,
30
+ "rope_interleave": true,
31
+ "rope_scaling": null,
32
+ "rope_theta": 1600000,
33
+ "tie_word_embeddings": true,
34
+ "torch_dtype": "bfloat16",
35
+ "transformers_version": "4.56.0",
36
+ "use_cache": true,
37
+ "v_head_dim": 128,
38
+ "vocab_size": 128256
39
+ }
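A quick way to sanity-check the architecture fields above, as a sketch (`trust_remote_code=True` is needed because `auto_map` points at the custom `configuration_youtu.py`/`modeling_youtu.py` in this repo; the repo id is assumed from the config docstring below):

```python
# Sketch: loading config.json above through its auto_map entries.
from transformers import AutoConfig

config = AutoConfig.from_pretrained("tencent/Youtu-LLM-2B", trust_remote_code=True)
assert config.model_type == "youtu_llm"
# Per-head query/key width is the no-RoPE part plus the RoPE part:
print(config.qk_nope_head_dim + config.qk_rope_head_dim)  # 128 + 64 = 192
```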
configuration_youtu.py ADDED
@@ -0,0 +1,198 @@
1
+ # coding=utf-8
2
+ # Copyright 2025 Tencent Youtu Lab and the HuggingFace Inc. team. All rights reserved.
3
+
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+ from transformers.configuration_utils import PretrainedConfig
16
+ from transformers.modeling_rope_utils import rope_config_validation
17
+
18
+
19
+ Youtu_PRETRAINED_CONFIG_ARCHIVE_MAP = {}
20
+
21
+
22
+ class YoutuConfig(PretrainedConfig):
23
+ r"""
24
+ This is the configuration class to store the configuration of a [`YoutuModel`]. It is used to instantiate a Youtu
25
+ model according to the specified arguments, defining the model architecture. Instantiating a configuration with the
26
+ defaults will yield a similar configuration to that of the Youtu-LLM-2B.
27
+ e.g. [tencent/Youtu-LLM-2B](https://huggingface.co/tencent/Youtu-LLM-2B)
28
+ Configuration objects inherit from [`PretrainedConfig`] and can be used to control the model outputs. Read the
29
+ documentation from [`PretrainedConfig`] for more information.
30
+
31
+
32
+ Args:
33
+ vocab_size (`int`, *optional*, defaults to 128256):
34
+ Vocabulary size of the Youtu model. Defines the number of different tokens that can be represented by the
35
+ `input_ids` passed when calling [`YoutuModel`]
36
+ hidden_size (`int`, *optional*, defaults to 2048):
37
+ Dimension of the hidden representations.
38
+ intermediate_size (`int`, *optional*, defaults to 6144):
39
+ Dimension of the MLP representations.
40
+ num_hidden_layers (`int`, *optional*, defaults to 32):
41
+ Number of hidden layers in the Transformer decoder.
42
+ num_attention_heads (`int`, *optional*, defaults to 16):
43
+ Number of attention heads for each attention layer in the Transformer decoder.
44
+ num_key_value_heads (`int`, *optional*, defaults to 16):
45
+ In MLA, num_key_value_heads=num_attention_heads.
46
+ kv_lora_rank (`int`, *optional*, defaults to 512):
47
+ Rank of the LoRA matrices for key and value projections.
48
+ q_lora_rank (`int`, *optional*, defaults to 1536):
49
+ Rank of the LoRA matrices for query projections.
50
+ qk_rope_head_dim (`int`, *optional*, defaults to 64):
51
+ Dimension of the query/key heads that use rotary position embeddings.
52
+ v_head_dim (`int`, *optional*, defaults to 128):
53
+ Dimension of the value heads.
54
+ qk_nope_head_dim (`int`, *optional*, defaults to 128):
55
+ Dimension of the query/key heads that don't use rotary position embeddings.
56
+ hidden_act (`str` or `function`, *optional*, defaults to `"silu"`):
57
+ The non-linear activation function (function or string) in the decoder.
58
+ max_position_embeddings (`int`, *optional*, defaults to 131072):
59
+ The maximum sequence length that this model might ever be used with.
60
+ initializer_range (`float`, *optional*, defaults to None):
61
+ The standard deviation of the truncated_normal_initializer for initializing all weight matrices, except embedding matrices.
62
+ embedding_initializer_range (`float`, *optional*, defaults to None):
63
+ The standard deviation of the truncated_normal_initializer for initializing all embedding matrices.
64
+ rms_norm_eps (`float`, *optional*, defaults to 1e-06):
65
+ The epsilon used by the rms normalization layers.
66
+ use_cache (`bool`, *optional*, defaults to `True`):
67
+ Whether or not the model should return the last key/values attentions (not used by all models). Only
68
+ relevant if `config.is_decoder=True`.
69
+ pad_token_id (`int`, *optional*):
70
+ Padding token id.
71
+ bos_token_id (`int`, *optional*, defaults to 128000):
72
+ Beginning of stream token id.
73
+ eos_token_id (`int`, *optional*, defaults to 128001):
74
+ End of stream token id.
75
+ tie_word_embeddings (`bool`, *optional*, defaults to `True`):
76
+ Whether to tie the input and output word embeddings.
77
+ rope_theta (`float`, *optional*, defaults to 1600000):
78
+ The base period of the RoPE embeddings.
79
+ rope_scaling (`Dict`, *optional*, defaults to `None`):
80
+ Dictionary containing the scaling configuration for the RoPE embeddings. Currently supports two scaling
81
+ strategies: linear and dynamic. Their scaling factor must be a float greater than 1. The expected format is
82
+ `{"type": strategy name, "factor": scaling factor}`. When using this flag, don't update
83
+ `max_position_embeddings` to the expected new maximum.
84
+ rope_interleave (`bool`, *optional*, defaults to `True`):
85
+ Whether to interleave the rotary position embeddings.
86
+ attention_bias (`bool`, *optional*, defaults to `False`):
87
+ Whether to use a bias in the query, key, value and output projection layers during self-attention.
88
+ attention_dropout (`float`, *optional*, defaults to 0.0):
89
+ The dropout ratio for the attention probabilities.
90
+
91
+ ```python
92
+ >>> from transformers import YoutuModel, YoutuConfig
93
+
94
+ >>> # Initializing a Youtu-LLM-2B style configuration
95
+ >>> configuration = YoutuConfig()
96
+
97
+ >>> model = YoutuModel(configuration)
+ >>> # Accessing the model configuration
98
+ >>> configuration = model.config
99
+ ```"""
100
+
101
+ model_type = "youtu_llm"
102
+ keys_to_ignore_at_inference = ["past_key_values"]
103
+ base_model_tp_plan = {
104
+ "layers.*.mlp.gate_proj": "local_colwise",
105
+ "layers.*.mlp.up_proj": "local_colwise",
106
+ "layers.*.mlp.down_proj": "local_rowwise",
107
+ "layers.*.mlp": "gather", # This is the only moment where results are gathered
108
+ }
109
+ base_model_pp_plan = {
110
+ "embed_tokens": (["input_ids"], ["inputs_embeds"]),
111
+ "layers": (["hidden_states", "attention_mask"], ["hidden_states"]),
112
+ "norm": (["hidden_states"], ["hidden_states"]),
113
+ }
114
+
115
+ def __init__(
116
+ self,
117
+ vocab_size=128256,
118
+ hidden_size=2048,
119
+ intermediate_size=6144,
120
+ num_hidden_layers=32,
121
+ num_attention_heads=16,
122
+ num_key_value_heads=16,
123
+ kv_lora_rank=512,
124
+ q_lora_rank=1536,
125
+ qk_rope_head_dim=64,
126
+ v_head_dim=128,
127
+ qk_nope_head_dim=128,
128
+ hidden_act="silu",
129
+ max_position_embeddings=131072,
130
+ initializer_range=None,
131
+ embedding_initializer_range=None,
132
+ rms_norm_eps=1e-6,
133
+ use_cache=True,
134
+ pad_token_id=None,
135
+ bos_token_id=128000,
136
+ eos_token_id=128001,
137
+ tie_word_embeddings=True,
138
+ rope_theta=1600000,
139
+ rope_scaling=None,
140
+ rope_interleave=True,
141
+ attention_bias=False,
142
+ attention_dropout=0.0,
143
+ **kwargs,
144
+ ):
145
+ self.vocab_size = vocab_size
146
+ self.max_position_embeddings = max_position_embeddings
147
+ self.hidden_size = hidden_size
148
+ self.intermediate_size = intermediate_size
149
+ self.num_hidden_layers = num_hidden_layers
150
+ self.num_attention_heads = num_attention_heads
151
+ self.kv_lora_rank = kv_lora_rank
152
+ self.q_lora_rank = q_lora_rank
153
+ self.qk_rope_head_dim = qk_rope_head_dim
154
+ self.v_head_dim = v_head_dim
155
+ self.qk_nope_head_dim = qk_nope_head_dim
156
+ self.qk_head_dim = qk_nope_head_dim + qk_rope_head_dim
157
+ self.head_dim = qk_rope_head_dim
158
+ self.rope_interleave = rope_interleave
159
+
160
+ # for backward compatibility
161
+ if num_key_value_heads is None:
162
+ num_key_value_heads = num_attention_heads
163
+
164
+ self.mlp_bias = False
165
+ self.num_key_value_heads = num_key_value_heads
166
+ self.hidden_act = hidden_act
167
+ # if initializer_range is None, set it to (2.0 / (5.0 * hidden_size)) ** 0.5
168
+ self.initializer_range = (2.0 / (5.0 * self.hidden_size)) ** 0.5 if initializer_range is None else initializer_range
169
+ # if embedding_initializer_range is None, set it to 2.0 * self.initializer_range
170
+ self.embedding_initializer_range = self.initializer_range * 2.0 if embedding_initializer_range is None else embedding_initializer_range
171
+ self.rms_norm_eps = rms_norm_eps
172
+ self.use_cache = use_cache
173
+ self.rope_theta = rope_theta
174
+ self.rope_scaling = rope_scaling
175
+ self.attention_bias = attention_bias
176
+ self.attention_dropout = attention_dropout
177
+ # Validate the correctness of rotary position embeddings parameters
178
+ # BC: if there is a 'type' field, copy it to 'rope_type'.
179
+ if self.rope_scaling is not None and "type" in self.rope_scaling:
180
+ self.rope_scaling["rope_type"] = self.rope_scaling["type"]
181
+
182
+ if self.rope_scaling is not None:
183
+ for key in ["beta_fast", "beta_slow", "factor"]:
184
+ if key in self.rope_scaling:
185
+ self.rope_scaling[key] = float(self.rope_scaling[key])
186
+
187
+ rope_config_validation(self)
188
+
189
+ super().__init__(
190
+ pad_token_id=pad_token_id,
191
+ bos_token_id=bos_token_id,
192
+ eos_token_id=eos_token_id,
193
+ tie_word_embeddings=tie_word_embeddings,
194
+ **kwargs,
195
+ )
196
+
197
+
198
+ __all__ = ["YoutuConfig"]
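As a worked example of the derived defaults above (a sketch, assuming `configuration_youtu.py` is importable from the working directory):

```python
# With hidden_size=2048 and initializer_range=None, __init__ derives:
#   initializer_range           = (2.0 / (5.0 * 2048)) ** 0.5 ≈ 0.01398
#   embedding_initializer_range = 2.0 * initializer_range     ≈ 0.02795
from configuration_youtu import YoutuConfig

cfg = YoutuConfig()
print(round(cfg.initializer_range, 5))            # 0.01398
print(round(cfg.embedding_initializer_range, 5))  # 0.02795
print(cfg.qk_head_dim)                            # 192 = qk_nope_head_dim + qk_rope_head_dim
```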
generation_config.json ADDED
@@ -0,0 +1,11 @@
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 128000,
4
+ "eos_token_id": 128001,
5
+ "do_sample": true,
6
+ "temperature": 1.0,
7
+ "top_k": 20,
8
+ "top_p": 0.95,
9
+ "transformers_version": "4.56.0",
10
+ "use_cache": false
11
+ }
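The defaults above select sampled decoding (temperature 1.0, top-k 20, top-p 0.95). A hedged usage sketch (repo id assumed; `generate()` picks these fields up from `generation_config.json` unless they are overridden at the call site):

```python
# Sketch: generation with the sampling defaults above.
import torch
from transformers import AutoModelForCausalLM, AutoTokenizer

model_id = "tencent/Youtu-LLM-2B"  # assumed repo id
tokenizer = AutoTokenizer.from_pretrained(model_id, trust_remote_code=True)
model = AutoModelForCausalLM.from_pretrained(
    model_id, trust_remote_code=True, torch_dtype=torch.bfloat16
)

inputs = tokenizer("The capital of France is", return_tensors="pt")
out = model.generate(
    **inputs,
    max_new_tokens=32,
    do_sample=True, temperature=1.0, top_k=20, top_p=0.95,  # mirrors the JSON above
)
print(tokenizer.decode(out[0], skip_special_tokens=True))
```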
model.safetensors ADDED
@@ -0,0 +1,3 @@
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf79fd0ade098cfa2fd78ba17592df25c9b9824cba3c1d87767c71146ef0b097
3
+ size 4448502056
modeling_youtu.py ADDED
@@ -0,0 +1,610 @@
1
+ # coding=utf-8
2
+ # Copyright 2025 Tencent Youtu lab, DeepSeek-AI and The HuggingFace Inc. team. All rights reserved.
3
+ #
4
+ # This code is based on EleutherAI's GPT-NeoX library and the GPT-NeoX
5
+ # and OPT implementations in this library. It has been modified from its
6
+ # original forms to accommodate minor architectural differences compared
7
+ # to GPT-NeoX and OPT used by the Meta AI team that trained the model.
8
+ #
9
+ # Licensed under the Apache License, Version 2.0 (the "License");
10
+ # you may not use this file except in compliance with the License.
11
+ # You may obtain a copy of the License at
12
+ #
13
+ # http://www.apache.org/licenses/LICENSE-2.0
14
+ #
15
+ # Unless required by applicable law or agreed to in writing, software
16
+ # distributed under the License is distributed on an "AS IS" BASIS,
17
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
18
+ # See the License for the specific language governing permissions and
19
+ # limitations under the License.
20
+ import math
21
+ from typing import Callable, Optional, Union
22
+
23
+ import torch
24
+ import torch.nn.functional as F
25
+ from torch import nn
26
+
27
+ from transformers.activations import ACT2FN
28
+ from transformers.cache_utils import Cache, DynamicCache
29
+ from transformers.generation import GenerationMixin
30
+ from transformers.integrations import use_kernel_forward_from_hub
31
+ from transformers.masking_utils import create_causal_mask
32
+ from transformers.modeling_flash_attention_utils import FlashAttentionKwargs
33
+ from transformers.modeling_layers import GradientCheckpointingLayer
34
+ from transformers.modeling_outputs import BaseModelOutputWithPast, CausalLMOutputWithPast
35
+ from transformers.modeling_rope_utils import ROPE_INIT_FUNCTIONS, dynamic_rope_update
36
+ from transformers.modeling_utils import ALL_ATTENTION_FUNCTIONS, PreTrainedModel
37
+ from transformers.processing_utils import Unpack
38
+ from transformers.utils import TransformersKwargs, auto_docstring, can_return_tuple
39
+ from transformers.utils.deprecation import deprecate_kwarg
40
+ from transformers.utils.generic import check_model_inputs
41
+ from .configuration_youtu import YoutuConfig
42
+
43
+
44
+ @use_kernel_forward_from_hub("RMSNorm")
45
+ class YoutuRMSNorm(nn.Module):
46
+ def __init__(self, hidden_size, eps=1e-6):
47
+ """
48
+ YoutuRMSNorm is equivalent to T5LayerNorm
49
+ """
50
+ super().__init__()
51
+ self.weight = nn.Parameter(torch.ones(hidden_size))
52
+ self.variance_epsilon = eps
53
+
54
+ def forward(self, hidden_states):
55
+ input_dtype = hidden_states.dtype
56
+ hidden_states = hidden_states.to(torch.float32)
57
+ variance = hidden_states.pow(2).mean(-1, keepdim=True)
58
+ hidden_states = hidden_states * torch.rsqrt(variance + self.variance_epsilon)
59
+ return self.weight * hidden_states.to(input_dtype)
60
+
61
+ def extra_repr(self):
62
+ return f"{tuple(self.weight.shape)}, eps={self.variance_epsilon}"
63
+
64
+
65
+ class YoutuRotaryEmbedding(nn.Module):
66
+ inv_freq: torch.Tensor # fix linting for `register_buffer`
67
+
68
+ def __init__(self, config: YoutuConfig, device=None):
69
+ super().__init__()
70
+ # BC: "rope_type" was originally "type"
71
+ if hasattr(config, "rope_scaling") and config.rope_scaling is not None:
72
+ self.rope_type = config.rope_scaling.get("rope_type", config.rope_scaling.get("type"))
73
+ else:
74
+ self.rope_type = "default"
75
+ self.max_seq_len_cached = config.max_position_embeddings
76
+ self.original_max_seq_len = config.max_position_embeddings
77
+
78
+ self.config = config
79
+ self.rope_init_fn = ROPE_INIT_FUNCTIONS[self.rope_type]
80
+
81
+ inv_freq, self.attention_scaling = self.rope_init_fn(self.config, device)
82
+ self.register_buffer("inv_freq", inv_freq, persistent=False)
83
+ self.original_inv_freq = self.inv_freq
84
+
85
+ @torch.no_grad()
86
+ @dynamic_rope_update # power user: used with advanced RoPE types (e.g. dynamic rope)
87
+ def forward(self, x, position_ids):
88
+ inv_freq_expanded = self.inv_freq[None, :, None].float().expand(position_ids.shape[0], -1, 1).to(x.device)
89
+ position_ids_expanded = position_ids[:, None, :].float()
90
+
91
+ device_type = x.device.type if isinstance(x.device.type, str) and x.device.type != "mps" else "cpu"
92
+ with torch.autocast(device_type=device_type, enabled=False): # Force float32
93
+ freqs = (inv_freq_expanded.float() @ position_ids_expanded.float()).transpose(1, 2)
94
+ emb = torch.cat((freqs, freqs), dim=-1)
95
+ cos = emb.cos() * self.attention_scaling
96
+ sin = emb.sin() * self.attention_scaling
97
+
98
+ return cos.to(dtype=x.dtype), sin.to(dtype=x.dtype)
99
+
100
+
101
+ class YoutuMLP(nn.Module):
102
+ def __init__(self, config, hidden_size=None, intermediate_size=None):
103
+ super().__init__()
104
+ self.config = config
105
+ self.hidden_size = config.hidden_size if hidden_size is None else hidden_size
106
+ self.intermediate_size = config.intermediate_size if intermediate_size is None else intermediate_size
107
+ self.mlp_bias = config.mlp_bias
108
+
109
+ self.gate_proj = nn.Linear(self.hidden_size, self.intermediate_size, bias=self.mlp_bias)
110
+ self.up_proj = nn.Linear(self.hidden_size, self.intermediate_size, bias=self.mlp_bias)
111
+ self.down_proj = nn.Linear(self.intermediate_size, self.hidden_size, bias=self.mlp_bias)
112
+ self.act_fn = ACT2FN[config.hidden_act]
113
+
114
+ def forward(self, x):
115
+ down_proj = self.down_proj(self.act_fn(self.gate_proj(x)) * self.up_proj(x))
116
+ return down_proj
117
+
118
+
119
+ def rotate_half(x):
120
+ """Rotates half the hidden dims of the input."""
121
+ x1 = x[..., : x.shape[-1] // 2]
122
+ x2 = x[..., x.shape[-1] // 2 :]
123
+ return torch.cat((-x2, x1), dim=-1)
124
+
125
+
126
+ def apply_rotary_pos_emb(q, k, cos, sin, position_ids=None, unsqueeze_dim=1):
127
+ """Applies Rotary Position Embedding to the query and key tensors.
128
+
129
+ Args:
130
+ q (`torch.Tensor`): The query tensor.
131
+ k (`torch.Tensor`): The key tensor.
132
+ cos (`torch.Tensor`): The cosine part of the rotary embedding.
133
+ sin (`torch.Tensor`): The sine part of the rotary embedding.
134
+ position_ids (`torch.Tensor`, *optional*):
135
+ Deprecated and unused.
136
+ unsqueeze_dim (`int`, *optional*, defaults to 1):
137
+ The 'unsqueeze_dim' argument specifies the dimension along which to unsqueeze cos[position_ids] and
138
+ sin[position_ids] so that they can be properly broadcasted to the dimensions of q and k. For example, note
139
+ that cos[position_ids] and sin[position_ids] have the shape [batch_size, seq_len, head_dim]. Then, if q and
140
+ k have the shape [batch_size, heads, seq_len, head_dim], then setting unsqueeze_dim=1 makes
141
+ cos[position_ids] and sin[position_ids] broadcastable to the shapes of q and k. Similarly, if q and k have
142
+ the shape [batch_size, seq_len, heads, head_dim], then set unsqueeze_dim=2.
143
+ Returns:
144
+ `tuple(torch.Tensor)` comprising of the query and key tensors rotated using the Rotary Position Embedding.
145
+ """
146
+ cos = cos.unsqueeze(unsqueeze_dim)
147
+ sin = sin.unsqueeze(unsqueeze_dim)
148
+ q_embed = (q * cos) + (rotate_half(q) * sin)
149
+ k_embed = (k * cos) + (rotate_half(k) * sin)
150
+ return q_embed, k_embed
151
+
152
+
153
+ def repeat_kv(hidden_states: torch.Tensor, n_rep: int) -> torch.Tensor:
154
+ """
155
+ This is the equivalent of torch.repeat_interleave(x, dim=1, repeats=n_rep). The hidden states go from (batch,
156
+ num_key_value_heads, seqlen, head_dim) to (batch, num_attention_heads, seqlen, head_dim)
157
+ """
158
+ batch, num_key_value_heads, slen, head_dim = hidden_states.shape
159
+ if n_rep == 1:
160
+ return hidden_states
161
+ hidden_states = hidden_states[:, :, None, :, :].expand(batch, num_key_value_heads, n_rep, slen, head_dim)
162
+ return hidden_states.reshape(batch, num_key_value_heads * n_rep, slen, head_dim)
163
+
164
+
165
+ def eager_attention_forward(
166
+ module: nn.Module,
167
+ query: torch.Tensor,
168
+ key: torch.Tensor,
169
+ value: torch.Tensor,
170
+ attention_mask: Optional[torch.Tensor],
171
+ scaling: float,
172
+ dropout: float = 0.0,
173
+ **kwargs: Unpack[TransformersKwargs],
174
+ ):
175
+ key_states = repeat_kv(key, module.num_key_value_groups)
176
+ value_states = repeat_kv(value, module.num_key_value_groups)
177
+
178
+ attn_weights = torch.matmul(query, key_states.transpose(2, 3)) * scaling
179
+ if attention_mask is not None:
180
+ causal_mask = attention_mask[:, :, :, : key_states.shape[-2]]
181
+ attn_weights = attn_weights + causal_mask
182
+
183
+ attn_weights = nn.functional.softmax(attn_weights, dim=-1, dtype=torch.float32).to(query.dtype)
184
+ attn_weights = nn.functional.dropout(attn_weights, p=dropout, training=module.training)
185
+ attn_output = torch.matmul(attn_weights, value_states)
186
+ attn_output = attn_output.transpose(1, 2).contiguous()
187
+
188
+ return attn_output, attn_weights
189
+
190
+
191
+ def apply_rotary_pos_emb_interleave(q, k, cos, sin, position_ids=None, unsqueeze_dim=1):
192
+ r"""
193
+ TODO let's just use the original freqcis computation to not have the view
194
+ transpose + reshape! This is not optimized!
195
+ Applies Rotary Position Embedding to the query and key tensors.
196
+
197
+ Args:
198
+ q (`torch.Tensor`): The query tensor.
199
+ k (`torch.Tensor`): The key tensor.
200
+ cos (`torch.Tensor`): The cosine part of the rotary embedding.
201
+ sin (`torch.Tensor`): The sine part of the rotary embedding.
202
+ position_ids (`torch.Tensor`):
203
+ The position indices of the tokens corresponding to the query and key tensors. For example, this can be
204
+ used to pass offsetted position ids when working with a KV-cache.
205
+ unsqueeze_dim (`int`, *optional*, defaults to 1):
206
+ The 'unsqueeze_dim' argument specifies the dimension along which to unsqueeze cos[position_ids] and
207
+ sin[position_ids] so that they can be properly broadcasted to the dimensions of q and k. For example, note
208
+ that cos[position_ids] and sin[position_ids] have the shape [batch_size, seq_len, head_dim]. Then, if q and
209
+ k have the shape [batch_size, heads, seq_len, head_dim], then setting unsqueeze_dim=1 makes
210
+ cos[position_ids] and sin[position_ids] broadcastable to the shapes of q and k. Similarly, if q and k have
211
+ the shape [batch_size, seq_len, heads, head_dim], then set unsqueeze_dim=2.
212
+ Returns:
213
+ `tuple(torch.Tensor)` comprising of the query and key tensors rotated using the Rotary Position Embedding.
214
+ """
215
+ cos = cos.unsqueeze(unsqueeze_dim)
216
+ sin = sin.unsqueeze(unsqueeze_dim)
217
+
218
+ b, h, s, d = q.shape
219
+ q = q.view(b, h, s, d // 2, 2).transpose(4, 3).reshape(b, h, s, d)
220
+
221
+ b, h, s, d = k.shape
222
+ k = k.view(b, h, s, d // 2, 2).transpose(4, 3).reshape(b, h, s, d)
223
+
224
+ q_embed = (q * cos) + (rotate_half(q) * sin)
225
+ k_embed = (k * cos) + (rotate_half(k) * sin)
226
+ return q_embed, k_embed
227
+
228
+
229
+ def yarn_get_mscale(scale=1, mscale=1):
230
+ if scale <= 1:
231
+ return 1.0
232
+ return 0.1 * mscale * math.log(scale) + 1.0
233
+
234
+
235
+ class YoutuMLAttention(nn.Module):
236
+ """Multi-latent attention from 'DeepSeek-V2: A Strong, Economical, and Efficient Mixture-of-Experts Language Model' paper"""
237
+
238
+ def __init__(self, config: YoutuConfig, layer_idx: int):
239
+ super().__init__()
240
+ self.config = config
241
+ self.layer_idx = layer_idx
242
+ self.num_key_value_groups = config.num_attention_heads // config.num_key_value_heads
243
+ self.attention_dropout = config.attention_dropout
244
+ self.num_heads = config.num_attention_heads
245
+ self.rope_theta = config.rope_theta
246
+ self.q_lora_rank = config.q_lora_rank
247
+ self.qk_rope_head_dim = config.qk_rope_head_dim
248
+ self.kv_lora_rank = config.kv_lora_rank
249
+ self.v_head_dim = config.v_head_dim
250
+ self.qk_nope_head_dim = config.qk_nope_head_dim
251
+ self.qk_head_dim = config.qk_head_dim
252
+
253
+ self.is_causal = True
254
+ if self.q_lora_rank is None:
255
+ self.q_proj = nn.Linear(config.hidden_size, self.num_heads * self.qk_head_dim, bias=False)
256
+ else:
257
+ self.q_a_proj = nn.Linear(config.hidden_size, config.q_lora_rank, bias=config.attention_bias)
258
+ self.q_a_layernorm = YoutuRMSNorm(config.q_lora_rank)
259
+ self.q_b_proj = nn.Linear(config.q_lora_rank, self.num_heads * self.qk_head_dim, bias=False)
260
+
261
+ self.kv_a_proj_with_mqa = nn.Linear(
262
+ config.hidden_size,
263
+ self.kv_lora_rank + self.qk_rope_head_dim,
264
+ bias=config.attention_bias,
265
+ )
266
+ self.kv_a_layernorm = YoutuRMSNorm(self.kv_lora_rank)
267
+ self.kv_b_proj = nn.Linear(
268
+ self.kv_lora_rank,
269
+ self.num_heads * (self.qk_nope_head_dim + self.v_head_dim),
270
+ bias=False,
271
+ )
272
+
273
+ self.o_proj = nn.Linear(
274
+ self.num_heads * self.v_head_dim,
275
+ config.hidden_size,
276
+ bias=config.attention_bias,
277
+ )
278
+
279
+ self.scaling = self.qk_head_dim ** (-0.5)
280
+ if self.config.rope_scaling is not None:
281
+ mscale_all_dim = self.config.rope_scaling.get("mscale_all_dim", 0)
282
+ scaling_factor = self.config.rope_scaling["factor"]
283
+ if mscale_all_dim:
284
+ mscale = yarn_get_mscale(scaling_factor, mscale_all_dim)
285
+ self.scaling = self.scaling * mscale * mscale
286
+
287
+ @deprecate_kwarg("past_key_value", new_name="past_key_values", version="4.58")
288
+ def forward(
289
+ self,
290
+ hidden_states: torch.Tensor,
291
+ position_embeddings: tuple[torch.Tensor, torch.Tensor],
292
+ attention_mask: Optional[torch.Tensor],
293
+ past_key_values: Optional[Cache] = None,
294
+ cache_position: Optional[torch.LongTensor] = None,
295
+ **kwargs: Unpack[FlashAttentionKwargs],
296
+ ) -> tuple[torch.Tensor, Optional[torch.Tensor], Optional[tuple[torch.Tensor]]]:
297
+ batch_size, seq_length = hidden_states.shape[:-1]
298
+ query_shape = (batch_size, seq_length, -1, self.qk_head_dim)
299
+ key_shape = (batch_size, seq_length, -1, self.qk_nope_head_dim + self.v_head_dim)
300
+
301
+ if self.q_lora_rank is None:
302
+ q_states = self.q_proj(hidden_states)
303
+ else:
304
+ q_states = self.q_b_proj(self.q_a_layernorm(self.q_a_proj(hidden_states)))
305
+ q_states = q_states.view(query_shape).transpose(1, 2)
306
+ q_pass, q_rot = torch.split(q_states, [self.qk_nope_head_dim, self.qk_rope_head_dim], dim=-1)
307
+
308
+ compressed_kv = self.kv_a_proj_with_mqa(hidden_states)
309
+ k_pass, k_rot = torch.split(compressed_kv, [self.kv_lora_rank, self.qk_rope_head_dim], dim=-1)
310
+
311
+ k_pass = self.kv_b_proj(self.kv_a_layernorm(k_pass)).view(key_shape).transpose(1, 2)
312
+ k_pass, value_states = torch.split(k_pass, [self.qk_nope_head_dim, self.v_head_dim], dim=-1)
313
+
314
+ k_rot = k_rot.view(batch_size, 1, seq_length, self.qk_rope_head_dim)
315
+
316
+ cos, sin = position_embeddings
317
+ if self.config.rope_interleave: # support using interleaved weights for efficiency
318
+ q_rot, k_rot = apply_rotary_pos_emb_interleave(q_rot, k_rot, cos, sin)
319
+ else:
320
+ q_rot, k_rot = apply_rotary_pos_emb(q_rot, k_rot, cos, sin)
321
+ k_rot = k_rot.expand(*k_pass.shape[:-1], -1)
322
+
323
+ query_states = torch.cat((q_pass, q_rot), dim=-1)
324
+ key_states = torch.cat((k_pass, k_rot), dim=-1)
325
+
326
+ if past_key_values is not None:
327
+ # sin and cos are specific to RoPE models; cache_position needed for the static cache
328
+ cache_kwargs = {"sin": sin, "cos": cos, "cache_position": cache_position}
329
+ key_states, value_states = past_key_values.update(key_states, value_states, self.layer_idx, cache_kwargs)
330
+
331
+ if self.config._attn_implementation == "flash_attention_2" and self.qk_head_dim != self.v_head_dim:
332
+ value_states = F.pad(value_states, [0, self.qk_head_dim - self.v_head_dim])
333
+
334
+ attention_interface: Callable = eager_attention_forward
335
+ if self.config._attn_implementation != "eager":
336
+ attention_interface = ALL_ATTENTION_FUNCTIONS[self.config._attn_implementation]
337
+
338
+ attn_output, attn_weights = attention_interface(
339
+ self,
340
+ query_states,
341
+ key_states,
342
+ value_states,
343
+ attention_mask,
344
+ dropout=0.0 if not self.training else self.attention_dropout,
345
+ scaling=self.scaling,
346
+ **kwargs,
347
+ )
348
+
349
+ if self.config._attn_implementation == "flash_attention_2" and self.qk_head_dim != self.v_head_dim:
350
+ attn_output = attn_output[:, :, :, : self.v_head_dim]
351
+
352
+ attn_output = attn_output.reshape(batch_size, seq_length, -1).contiguous()
353
+ attn_output = self.o_proj(attn_output)
354
+ return attn_output, attn_weights
355
+
356
+
357
+ class YoutuDecoderLayer(GradientCheckpointingLayer):
358
+ def __init__(self, config: YoutuConfig, layer_idx: int):
359
+ super().__init__()
360
+ self.hidden_size = config.hidden_size
361
+ self.self_attn = YoutuMLAttention(config=config, layer_idx=layer_idx)
362
+ self.mlp = YoutuMLP(config)
363
+ self.input_layernorm = YoutuRMSNorm(config.hidden_size, eps=config.rms_norm_eps)
364
+ self.post_attention_layernorm = YoutuRMSNorm(config.hidden_size, eps=config.rms_norm_eps)
365
+
366
+ @deprecate_kwarg("past_key_value", new_name="past_key_values", version="4.58")
367
+ def forward(
368
+ self,
369
+ hidden_states: torch.Tensor,
370
+ attention_mask: Optional[torch.Tensor] = None,
371
+ position_ids: Optional[torch.LongTensor] = None,
372
+ past_key_values: Optional[Cache] = None,
373
+ use_cache: Optional[bool] = False,
374
+ cache_position: Optional[torch.LongTensor] = None,
375
+ position_embeddings: Optional[tuple[torch.Tensor, torch.Tensor]] = None, # necessary, but kept here for BC
376
+ **kwargs: Unpack[TransformersKwargs],
377
+ ) -> torch.Tensor:
378
+ residual = hidden_states
379
+ hidden_states = self.input_layernorm(hidden_states)
380
+ # Self Attention
381
+ hidden_states, _ = self.self_attn(
382
+ hidden_states=hidden_states,
383
+ attention_mask=attention_mask,
384
+ position_ids=position_ids,
385
+ past_key_values=past_key_values,
386
+ use_cache=use_cache,
387
+ cache_position=cache_position,
388
+ position_embeddings=position_embeddings,
389
+ **kwargs,
390
+ )
391
+ hidden_states = residual + hidden_states
392
+
393
+ # Fully Connected
394
+ residual = hidden_states
395
+ hidden_states = self.post_attention_layernorm(hidden_states)
396
+ hidden_states = self.mlp(hidden_states)
397
+ hidden_states = residual + hidden_states
398
+ return hidden_states
399
+
400
+ @auto_docstring
401
+ class YoutuPreTrainedModel(PreTrainedModel):
402
+ config: YoutuConfig
403
+ base_model_prefix = "model"
404
+ supports_gradient_checkpointing = True
405
+ _no_split_modules = ["YoutuDecoderLayer"]
406
+ _skip_keys_device_placement = ["past_key_values"]
407
+ _supports_flash_attn = True
408
+ _supports_sdpa = True
409
+ _supports_flex_attn = True
410
+ _can_compile_fullgraph = False
411
+ _supports_attention_backend = True
412
+ _can_record_outputs = {
413
+ "hidden_states": YoutuDecoderLayer,
414
+ "attentions": YoutuMLAttention,
415
+ }
416
+
417
+ def init_weights(self):
418
+ """
419
+ Prunes heads if needed and, when requested, initializes weights. If using a custom `PreTrainedModel`, you need to implement any
420
+ initialization logic in `_init_weights`.
421
+ """
422
+ # Prune heads if needed
423
+ if self.config.pruned_heads:
424
+ self.prune_heads(self.config.pruned_heads)
425
+
426
+ if "-init" in self.name_or_path:
427
+ # Initialize weights
428
+ self.apply(self._initialize_weights)
429
+
430
+ # Adjust weights of o_proj in Attention and down_proj in MLP
431
+ for name, module in self.named_modules():
432
+ if "o_proj" in name or "down_proj" in name:
433
+ # For the output projection, we reinitialize the weights
434
+ scaled_std = self.config.initializer_range * (1.0 / self.config.num_hidden_layers) ** 0.5
435
+ module.weight.data.normal_(mean=0.0, std=scaled_std)
436
+
437
+ # Tie weights should be skipped when not initializing all weights
438
+ # since from_pretrained(...) calls tie weights anyways
439
+ self.tie_weights()
440
+
441
+ def _init_weights(self, module):
442
+ super()._init_weights(module)
443
+ std = self.config.initializer_range
444
+ embedding_std = self.config.embedding_initializer_range
445
+ if isinstance(module, nn.Linear):
446
+ module.weight.data.normal_(mean=0.0, std=std)
447
+ if module.bias is not None:
448
+ module.bias.data.zero_()
449
+ elif isinstance(module, nn.Embedding):
450
+ module.weight.data.normal_(mean=0.0, std=embedding_std)
451
+ if module.padding_idx is not None:
452
+ module.weight.data[module.padding_idx].zero_()
453
+
454
+ @auto_docstring
455
+ class YoutuModel(YoutuPreTrainedModel):
456
+ _keys_to_ignore_on_load_unexpected = [""]
457
+
458
+ def __init__(self, config: YoutuConfig):
459
+ super().__init__(config)
460
+ self.padding_idx = config.pad_token_id
461
+ self.vocab_size = config.vocab_size
462
+
463
+ self.embed_tokens = nn.Embedding(config.vocab_size, config.hidden_size, self.padding_idx)
464
+ self.layers = nn.ModuleList(
465
+ [YoutuDecoderLayer(config, layer_idx) for layer_idx in range(config.num_hidden_layers)]
466
+ )
467
+ self.norm = YoutuRMSNorm(config.hidden_size, eps=config.rms_norm_eps)
468
+ self.rotary_emb = YoutuRotaryEmbedding(config=config)
469
+ self.gradient_checkpointing = False
470
+
471
+ # Initialize weights and apply final processing
472
+ self.post_init()
473
+
474
+ @check_model_inputs
475
+ @auto_docstring
476
+ def forward(
477
+ self,
478
+ input_ids: Optional[torch.LongTensor] = None,
479
+ attention_mask: Optional[torch.Tensor] = None,
480
+ position_ids: Optional[torch.LongTensor] = None,
481
+ past_key_values: Optional[Cache] = None,
482
+ inputs_embeds: Optional[torch.FloatTensor] = None,
483
+ cache_position: Optional[torch.LongTensor] = None,
484
+ use_cache: Optional[bool] = None,
485
+ **kwargs: Unpack[TransformersKwargs],
486
+ ) -> BaseModelOutputWithPast:
487
+ if (input_ids is None) ^ (inputs_embeds is not None):
488
+ raise ValueError("You must specify exactly one of input_ids or inputs_embeds")
489
+
490
+ if inputs_embeds is None:
491
+ inputs_embeds: torch.Tensor = self.embed_tokens(input_ids)
492
+
493
+ if use_cache and past_key_values is None:
494
+ past_key_values = DynamicCache(config=self.config)
495
+
496
+ if cache_position is None:
497
+ past_seen_tokens = past_key_values.get_seq_length() if past_key_values is not None else 0
498
+ cache_position: torch.Tensor = torch.arange(
499
+ past_seen_tokens, past_seen_tokens + inputs_embeds.shape[1], device=inputs_embeds.device
500
+ )
501
+
502
+ if position_ids is None:
503
+ position_ids = cache_position.unsqueeze(0)
504
+
505
+ causal_mask = create_causal_mask(
506
+ config=self.config,
507
+ input_embeds=inputs_embeds,
508
+ attention_mask=attention_mask,
509
+ cache_position=cache_position,
510
+ past_key_values=past_key_values,
511
+ position_ids=position_ids,
512
+ )
513
+
514
+ hidden_states = inputs_embeds
515
+ position_embeddings = self.rotary_emb(hidden_states, position_ids)
516
+
517
+ for decoder_layer in self.layers[: self.config.num_hidden_layers]:
518
+ hidden_states = decoder_layer(
519
+ hidden_states,
520
+ attention_mask=causal_mask,
521
+ position_ids=position_ids,
522
+ past_key_values=past_key_values,
523
+ cache_position=cache_position,
524
+ position_embeddings=position_embeddings,
525
+ **kwargs,
526
+ )
527
+
528
+ hidden_states = self.norm(hidden_states)
529
+ return BaseModelOutputWithPast(
530
+ last_hidden_state=hidden_states,
531
+ past_key_values=past_key_values,
532
+ )
533
+
534
+
535
+ @auto_docstring
536
+ class YoutuForCausalLM(YoutuPreTrainedModel, GenerationMixin):
537
+ _tied_weights_keys = ["lm_head.weight"]
538
+ _tp_plan = {"lm_head": "colwise_rep"}
539
+ _pp_plan = {"lm_head": (["hidden_states"], ["logits"])}
540
+
541
+ def __init__(self, config):
542
+ super().__init__(config)
543
+ self.model = YoutuModel(config)
544
+ self.vocab_size = config.vocab_size
545
+ self.lm_head = nn.Linear(config.hidden_size, config.vocab_size, bias=False)
546
+
547
+ # Initialize weights and apply final processing
548
+ self.post_init()
549
+
550
+ @can_return_tuple
551
+ @auto_docstring
552
+ def forward(
553
+ self,
554
+ input_ids: Optional[torch.LongTensor] = None,
555
+ attention_mask: Optional[torch.Tensor] = None,
556
+ position_ids: Optional[torch.LongTensor] = None,
557
+ past_key_values: Optional[Cache] = None,
558
+ inputs_embeds: Optional[torch.FloatTensor] = None,
559
+ labels: Optional[torch.LongTensor] = None,
560
+ use_cache: Optional[bool] = None,
561
+ cache_position: Optional[torch.LongTensor] = None,
562
+ logits_to_keep: Union[int, torch.Tensor] = 0,
563
+ **kwargs: Unpack[TransformersKwargs],
564
+ ) -> CausalLMOutputWithPast:
565
+ r"""
566
+ Example:
567
+
568
+ ```python
569
+ >>> from transformers import YoutuTokenizer, YoutuForCausalLM
570
+
571
+ >>> model = YoutuForCausalLM.from_pretrained("tencent/Youtu-LLM-2B")
572
+ >>> tokenizer = YoutuTokenizer.from_pretrained("tencent/Youtu-LLM-2B")
573
+
574
+ >>> prompt = "Hey, are you conscious? Can you talk to me?"
575
+ >>> inputs = tokenizer(prompt, return_tensors="pt")
576
+
577
+ >>> # Generate
578
+ >>> generate_ids = model.generate(inputs.input_ids, max_length=30)
579
+ >>> tokenizer.batch_decode(generate_ids, skip_special_tokens=True, clean_up_tokenization_spaces=False)[0]
580
+ ```"""
581
+ outputs: BaseModelOutputWithPast = self.model(
582
+ input_ids=input_ids,
583
+ attention_mask=attention_mask,
584
+ position_ids=position_ids,
585
+ past_key_values=past_key_values,
586
+ inputs_embeds=inputs_embeds,
587
+ use_cache=use_cache,
588
+ cache_position=cache_position,
589
+ **kwargs,
590
+ )
591
+
592
+ hidden_states = outputs.last_hidden_state
593
+ # Only compute necessary logits, and do not upcast them to float if we are not computing the loss
594
+ slice_indices = slice(-logits_to_keep, None) if isinstance(logits_to_keep, int) else logits_to_keep
595
+ logits = self.lm_head(hidden_states[:, slice_indices, :])
596
+
597
+ loss = None
598
+ if labels is not None:
599
+ loss = self.loss_function(logits=logits, labels=labels, vocab_size=self.config.vocab_size, **kwargs)
600
+
601
+ return CausalLMOutputWithPast(
602
+ loss=loss,
603
+ logits=logits,
604
+ past_key_values=outputs.past_key_values,
605
+ hidden_states=outputs.hidden_states,
606
+ attentions=outputs.attentions,
607
+ )
608
+
609
+
610
+ __all__ = ["YoutuPreTrainedModel", "YoutuModel", "YoutuForCausalLM"]
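To make the MLA data flow above concrete, here is a small shape walkthrough (a sketch; it assumes `configuration_youtu.py` and `modeling_youtu.py` sit in the working directory, and it uses the dimensions from `config.json`):

```python
# Sketch: KV-compression shapes inside YoutuMLAttention.
import torch
from configuration_youtu import YoutuConfig
from modeling_youtu import YoutuMLAttention

cfg = YoutuConfig()
attn = YoutuMLAttention(cfg, layer_idx=0)

x = torch.randn(1, 8, cfg.hidden_size)      # (batch=1, seq=8, 2048)
compressed_kv = attn.kv_a_proj_with_mqa(x)  # (1, 8, 512 + 64)
k_pass, k_rot = torch.split(
    compressed_kv, [cfg.kv_lora_rank, cfg.qk_rope_head_dim], dim=-1
)
print(k_pass.shape)  # torch.Size([1, 8, 512]) -> shared latent KV
print(k_rot.shape)   # torch.Size([1, 8, 64])  -> single RoPE key shared by all heads
```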
special_tokens_map.json ADDED
@@ -0,0 +1,23 @@
1
+ {
2
+ "bos_token": {
3
+ "content": "<|begin_of_text|>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "<|end_of_text|>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "<|end_of_text|>",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ }
23
+ }
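A quick round-trip check of the map above (a sketch; repo id assumed, and the token ids match `config.json`):

```python
# Sketch: the special tokens above, as seen by the tokenizer.
from transformers import AutoTokenizer

tok = AutoTokenizer.from_pretrained("tencent/Youtu-LLM-2B", trust_remote_code=True)
print(tok.bos_token, tok.convert_tokens_to_ids(tok.bos_token))  # <|begin_of_text|> 128000
print(tok.eos_token, tok.convert_tokens_to_ids(tok.eos_token))  # <|end_of_text|> 128001
print(tok.pad_token == tok.eos_token)                           # True
```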
tokenizer.json ADDED
@@ -0,0 +1,3 @@
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2885591ad59de23306329eb64e179951e6f21ea1a6d1f9dc1dca83cf558ef31c
3
+ size 9353318
tokenizer_config.json ADDED
@@ -0,0 +1,2064 @@
1
+ {
2
+ "added_tokens_decoder": {
3
+ "128000": {
4
+ "content": "<|begin_of_text|>",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "128001": {
12
+ "content": "<|end_of_text|>",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "128002": {
20
+ "content": "<|reserved_special_token_0|>",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "128003": {
28
+ "content": "<|reserved_special_token_1|>",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "128004": {
36
+ "content": "<|finetune_right_pad_id|>",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ },
43
+ "128005": {
44
+ "content": "<|reserved_special_token_2|>",
45
+ "lstrip": false,
46
+ "normalized": false,
47
+ "rstrip": false,
48
+ "single_word": false,
49
+ "special": true
50
+ },
51
+ "128006": {
52
+ "content": "<|start_header_id|>",
53
+ "lstrip": false,
54
+ "normalized": false,
55
+ "rstrip": false,
56
+ "single_word": false,
57
+ "special": true
58
+ },
59
+ "128007": {
60
+ "content": "<|end_header_id|>",
61
+ "lstrip": false,
62
+ "normalized": false,
63
+ "rstrip": false,
64
+ "single_word": false,
65
+ "special": true
66
+ },
67
+ "128008": {
68
+ "content": "<|eom_id|>",
69
+ "lstrip": false,
70
+ "normalized": false,
71
+ "rstrip": false,
72
+ "single_word": false,
73
+ "special": true
74
+ },
75
+ "128009": {
76
+ "content": "<|eot_id|>",
77
+ "lstrip": false,
78
+ "normalized": false,
79
+ "rstrip": false,
80
+ "single_word": false,
81
+ "special": true
82
+ },
83
+ "128010": {
84
+ "content": "<|python_tag|>",
85
+ "lstrip": false,
86
+ "normalized": false,
87
+ "rstrip": false,
88
+ "single_word": false,
89
+ "special": true
90
+ },
91
+ "128011": {
92
+ "content": "<|fim_prefix|>",
93
+ "lstrip": false,
94
+ "normalized": false,
95
+ "rstrip": false,
96
+ "single_word": false,
97
+ "special": true
98
+ },
99
+ "128012": {
100
+ "content": "<|fim_suffix|>",
101
+ "lstrip": false,
102
+ "normalized": false,
103
+ "rstrip": false,
104
+ "single_word": false,
105
+ "special": true
106
+ },
107
+ "128013": {
108
+ "content": "<|fim_middle|>",
109
+ "lstrip": false,
110
+ "normalized": false,
111
+ "rstrip": false,
112
+ "single_word": false,
113
+ "special": true
114
+ },
115
+ "128014": {
116
+ "content": "<repo_name>",
117
+ "lstrip": false,
118
+ "normalized": false,
119
+ "rstrip": false,
120
+ "single_word": false,
121
+ "special": true
122
+ },
123
+ "128015": {
124
+ "content": "<file_sep>",
125
+ "lstrip": false,
126
+ "normalized": false,
127
+ "rstrip": false,
128
+ "single_word": false,
129
+ "special": true
130
+ },
131
+ "128016": {
132
+ "content": "<|reserved_special_token_8|>",
133
+ "lstrip": false,
134
+ "normalized": false,
135
+ "rstrip": false,
136
+ "single_word": false,
137
+ "special": true
138
+ },
139
+ "128017": {
140
+ "content": "<|reserved_special_token_9|>",
141
+ "lstrip": false,
142
+ "normalized": false,
143
+ "rstrip": false,
144
+ "single_word": false,
145
+ "special": true
146
+ },
147
+ "128018": {
148
+ "content": "<|trace_context_start|>",
149
+ "lstrip": false,
150
+ "normalized": false,
151
+ "rstrip": false,
152
+ "single_word": false,
153
+ "special": true
154
+ },
155
+ "128019": {
156
+ "content": "<|frame_sep|>",
157
+ "lstrip": false,
158
+ "normalized": false,
159
+ "rstrip": false,
160
+ "single_word": false,
161
+ "special": true
162
+ },
163
+ "128020": {
164
+ "content": "<|call_sep|>",
165
+ "lstrip": false,
166
+ "normalized": false,
167
+ "rstrip": false,
168
+ "single_word": false,
169
+ "special": true
170
+ },
171
+ "128021": {
172
+ "content": "<|action_sep|>",
173
+ "lstrip": false,
174
+ "normalized": false,
175
+ "rstrip": false,
176
+ "single_word": false,
177
+ "special": true
178
+ },
179
+ "128022": {
180
+ "content": "<|line_sep|>",
181
+ "lstrip": false,
182
+ "normalized": false,
183
+ "rstrip": false,
184
+ "single_word": false,
185
+ "special": true
186
+ },
187
+ "128023": {
188
+ "content": "<|return_sep|>",
189
+ "lstrip": false,
190
+ "normalized": false,
191
+ "rstrip": false,
192
+ "single_word": false,
193
+ "special": true
194
+ },
195
+ "128024": {
196
+ "content": "<|arg_sep|>",
197
+ "lstrip": false,
198
+ "normalized": false,
199
+ "rstrip": false,
200
+ "single_word": false,
201
+ "special": true
202
+ },
203
+ "128025": {
204
+ "content": "<|trace_context_end|>",
205
+ "lstrip": false,
206
+ "normalized": false,
207
+ "rstrip": false,
208
+ "single_word": false,
209
+ "special": true
210
+ },
211
+ "128026": {
212
+ "content": "<|reserved_special_token_18|>",
213
+ "lstrip": false,
214
+ "normalized": false,
215
+ "rstrip": false,
216
+ "single_word": false,
217
+ "special": true
218
+ },
219
+ "128027": {
220
+ "content": "<|reserved_special_token_19|>",
221
+ "lstrip": false,
222
+ "normalized": false,
223
+ "rstrip": false,
224
+ "single_word": false,
225
+ "special": true
226
+ },
227
+ "128028": {
228
+ "content": "<|reserved_special_token_20|>",
229
+ "lstrip": false,
230
+ "normalized": false,
231
+ "rstrip": false,
232
+ "single_word": false,
233
+ "special": true
234
+ },
235
+ "128029": {
236
+ "content": "<|reserved_special_token_21|>",
237
+ "lstrip": false,
238
+ "normalized": false,
239
+ "rstrip": false,
240
+ "single_word": false,
241
+ "special": true
242
+ },
243
+ "128030": {
244
+ "content": "<|reserved_special_token_22|>",
245
+ "lstrip": false,
246
+ "normalized": false,
247
+ "rstrip": false,
248
+ "single_word": false,
249
+ "special": true
250
+ },
251
+ "128031": {
252
+ "content": "<|reserved_special_token_23|>",
253
+ "lstrip": false,
254
+ "normalized": false,
255
+ "rstrip": false,
256
+ "single_word": false,
257
+ "special": true
258
+ },
259
+ "128032": {
260
+ "content": "<|reserved_special_token_24|>",
261
+ "lstrip": false,
262
+ "normalized": false,
263
+ "rstrip": false,
264
+ "single_word": false,
265
+ "special": true
266
+ },
267
+ "128033": {
268
+ "content": "<|reserved_special_token_25|>",
269
+ "lstrip": false,
270
+ "normalized": false,
271
+ "rstrip": false,
272
+ "single_word": false,
273
+ "special": true
274
+ },
275
+ "128034": {
276
+ "content": "<|reserved_special_token_26|>",
277
+ "lstrip": false,
278
+ "normalized": false,
279
+ "rstrip": false,
280
+ "single_word": false,
281
+ "special": true
282
+ },
283
+ "128035": {
284
+ "content": "<|reserved_special_token_27|>",
285
+ "lstrip": false,
286
+ "normalized": false,
287
+ "rstrip": false,
288
+ "single_word": false,
289
+ "special": true
290
+ },
291
+ "128036": {
292
+ "content": "<|reserved_special_token_28|>",
293
+ "lstrip": false,
294
+ "normalized": false,
295
+ "rstrip": false,
296
+ "single_word": false,
297
+ "special": true
298
+ },
299
+ "128037": {
300
+ "content": "<|reserved_special_token_29|>",
301
+ "lstrip": false,
302
+ "normalized": false,
303
+ "rstrip": false,
304
+ "single_word": false,
305
+ "special": true
306
+ },
307
+ "128038": {
308
+ "content": "<|reserved_special_token_30|>",
309
+ "lstrip": false,
310
+ "normalized": false,
311
+ "rstrip": false,
312
+ "single_word": false,
313
+ "special": true
314
+ },
315
+ "128039": {
316
+ "content": "<|reserved_special_token_31|>",
317
+ "lstrip": false,
318
+ "normalized": false,
319
+ "rstrip": false,
320
+ "single_word": false,
321
+ "special": true
322
+ },
323
+ "128040": {
324
+ "content": "<|reserved_special_token_32|>",
325
+ "lstrip": false,
326
+ "normalized": false,
327
+ "rstrip": false,
328
+ "single_word": false,
329
+ "special": true
330
+ },
331
+ "128041": {
332
+ "content": "<|reserved_special_token_33|>",
333
+ "lstrip": false,
334
+ "normalized": false,
335
+ "rstrip": false,
336
+ "single_word": false,
337
+ "special": true
338
+ },
339
+ "128042": {
340
+ "content": "<|reserved_special_token_34|>",
341
+ "lstrip": false,
342
+ "normalized": false,
343
+ "rstrip": false,
344
+ "single_word": false,
345
+ "special": true
346
+ },
347
+ "128043": {
348
+ "content": "<|reserved_special_token_35|>",
349
+ "lstrip": false,
350
+ "normalized": false,
351
+ "rstrip": false,
352
+ "single_word": false,
353
+ "special": true
354
+ },
355
+ "128044": {
356
+ "content": "<|reserved_special_token_36|>",
357
+ "lstrip": false,
358
+ "normalized": false,
359
+ "rstrip": false,
360
+ "single_word": false,
361
+ "special": true
362
+ },
363
+ "128045": {
364
+ "content": "<|reserved_special_token_37|>",
365
+ "lstrip": false,
366
+ "normalized": false,
367
+ "rstrip": false,
368
+ "single_word": false,
369
+ "special": true
370
+ },
371
+ "128046": {
372
+ "content": "<|reserved_special_token_38|>",
373
+ "lstrip": false,
374
+ "normalized": false,
375
+ "rstrip": false,
376
+ "single_word": false,
377
+ "special": true
378
+ },
379
+ "128047": {
380
+ "content": "<|reserved_special_token_39|>",
381
+ "lstrip": false,
382
+ "normalized": false,
383
+ "rstrip": false,
384
+ "single_word": false,
385
+ "special": true
386
+ },
387
+ "128048": {
388
+ "content": "<|reserved_special_token_40|>",
389
+ "lstrip": false,
390
+ "normalized": false,
391
+ "rstrip": false,
392
+ "single_word": false,
393
+ "special": true
394
+ },
395
+ "128049": {
396
+ "content": "<|reserved_special_token_41|>",
397
+ "lstrip": false,
398
+ "normalized": false,
399
+ "rstrip": false,
400
+ "single_word": false,
401
+ "special": true
402
+ },
403
+ "128050": {
404
+ "content": "<|reserved_special_token_42|>",
405
+ "lstrip": false,
406
+ "normalized": false,
407
+ "rstrip": false,
408
+ "single_word": false,
409
+ "special": true
410
+ },
411
+ "128051": {
412
+ "content": "<|reserved_special_token_43|>",
413
+ "lstrip": false,
414
+ "normalized": false,
415
+ "rstrip": false,
416
+ "single_word": false,
417
+ "special": true
418
+ },
419
+ "128052": {
420
+ "content": "<|reserved_special_token_44|>",
421
+ "lstrip": false,
422
+ "normalized": false,
423
+ "rstrip": false,
424
+ "single_word": false,
425
+ "special": true
426
+ },
427
+ "128053": {
428
+ "content": "<|reserved_special_token_45|>",
429
+ "lstrip": false,
430
+ "normalized": false,
431
+ "rstrip": false,
432
+ "single_word": false,
433
+ "special": true
434
+ },
435
+ "128054": {
436
+ "content": "<|reserved_special_token_46|>",
437
+ "lstrip": false,
438
+ "normalized": false,
439
+ "rstrip": false,
440
+ "single_word": false,
441
+ "special": true
442
+ },
443
+ "128055": {
444
+ "content": "<|reserved_special_token_47|>",
445
+ "lstrip": false,
446
+ "normalized": false,
447
+ "rstrip": false,
448
+ "single_word": false,
449
+ "special": true
450
+ },
451
+ "128056": {
452
+ "content": "<|reserved_special_token_48|>",
453
+ "lstrip": false,
454
+ "normalized": false,
455
+ "rstrip": false,
456
+ "single_word": false,
457
+ "special": true
458
+ },
459
+ "128057": {
460
+ "content": "<|reserved_special_token_49|>",
461
+ "lstrip": false,
462
+ "normalized": false,
463
+ "rstrip": false,
464
+ "single_word": false,
465
+ "special": true
466
+ },
467
+ "128058": {
468
+ "content": "<|reserved_special_token_50|>",
469
+ "lstrip": false,
470
+ "normalized": false,
471
+ "rstrip": false,
472
+ "single_word": false,
473
+ "special": true
474
+ },
475
+ "128059": {
476
+ "content": "<|reserved_special_token_51|>",
477
+ "lstrip": false,
478
+ "normalized": false,
479
+ "rstrip": false,
480
+ "single_word": false,
481
+ "special": true
482
+ },
483
+ "128060": {
484
+ "content": "<|reserved_special_token_52|>",
485
+ "lstrip": false,
486
+ "normalized": false,
487
+ "rstrip": false,
488
+ "single_word": false,
489
+ "special": true
490
+ },
491
+ "128061": {
492
+ "content": "<|reserved_special_token_53|>",
493
+ "lstrip": false,
494
+ "normalized": false,
495
+ "rstrip": false,
496
+ "single_word": false,
497
+ "special": true
498
+ },
499
+ "128062": {
500
+ "content": "<|reserved_special_token_54|>",
501
+ "lstrip": false,
502
+ "normalized": false,
503
+ "rstrip": false,
504
+ "single_word": false,
505
+ "special": true
506
+ },
507
+ "128063": {
508
+ "content": "<|reserved_special_token_55|>",
509
+ "lstrip": false,
510
+ "normalized": false,
511
+ "rstrip": false,
512
+ "single_word": false,
513
+ "special": true
514
+ },
515
+ "128064": {
516
+ "content": "<|reserved_special_token_56|>",
517
+ "lstrip": false,
518
+ "normalized": false,
519
+ "rstrip": false,
520
+ "single_word": false,
521
+ "special": true
522
+ },
523
+ "128065": {
524
+ "content": "<|reserved_special_token_57|>",
525
+ "lstrip": false,
526
+ "normalized": false,
527
+ "rstrip": false,
528
+ "single_word": false,
529
+ "special": true
530
+ },
531
+ "128066": {
532
+ "content": "<|reserved_special_token_58|>",
533
+ "lstrip": false,
534
+ "normalized": false,
535
+ "rstrip": false,
536
+ "single_word": false,
537
+ "special": true
538
+ },
539
+ "128067": {
540
+ "content": "<|reserved_special_token_59|>",
541
+ "lstrip": false,
542
+ "normalized": false,
543
+ "rstrip": false,
544
+ "single_word": false,
545
+ "special": true
546
+ },
547
+ "128068": {
548
+ "content": "<|reserved_special_token_60|>",
549
+ "lstrip": false,
550
+ "normalized": false,
551
+ "rstrip": false,
552
+ "single_word": false,
553
+ "special": true
554
+ },
555
+ "128069": {
556
+ "content": "<|reserved_special_token_61|>",
557
+ "lstrip": false,
558
+ "normalized": false,
559
+ "rstrip": false,
560
+ "single_word": false,
561
+ "special": true
562
+ },
563
+ "128070": {
564
+ "content": "<|reserved_special_token_62|>",
565
+ "lstrip": false,
566
+ "normalized": false,
567
+ "rstrip": false,
568
+ "single_word": false,
569
+ "special": true
570
+ },
571
+ "128071": {
572
+ "content": "<|reserved_special_token_63|>",
573
+ "lstrip": false,
574
+ "normalized": false,
575
+ "rstrip": false,
576
+ "single_word": false,
577
+ "special": true
578
+ },
579
+ "128072": {
580
+ "content": "<|reserved_special_token_64|>",
581
+ "lstrip": false,
582
+ "normalized": false,
583
+ "rstrip": false,
584
+ "single_word": false,
585
+ "special": true
586
+ },
587
+ "128073": {
588
+ "content": "<|reserved_special_token_65|>",
589
+ "lstrip": false,
590
+ "normalized": false,
591
+ "rstrip": false,
592
+ "single_word": false,
593
+ "special": true
594
+ },
595
+ "128074": {
596
+ "content": "<|reserved_special_token_66|>",
597
+ "lstrip": false,
598
+ "normalized": false,
599
+ "rstrip": false,
600
+ "single_word": false,
601
+ "special": true
602
+ },
603
+ "128075": {
604
+ "content": "<|reserved_special_token_67|>",
605
+ "lstrip": false,
606
+ "normalized": false,
607
+ "rstrip": false,
608
+ "single_word": false,
609
+ "special": true
610
+ },
611
+ "128076": {
612
+ "content": "<|reserved_special_token_68|>",
613
+ "lstrip": false,
614
+ "normalized": false,
615
+ "rstrip": false,
616
+ "single_word": false,
617
+ "special": true
618
+ },
619
+ "128077": {
620
+ "content": "<|reserved_special_token_69|>",
621
+ "lstrip": false,
622
+ "normalized": false,
623
+ "rstrip": false,
624
+ "single_word": false,
625
+ "special": true
626
+ },
627
+ "128078": {
628
+ "content": "<|reserved_special_token_70|>",
629
+ "lstrip": false,
630
+ "normalized": false,
631
+ "rstrip": false,
632
+ "single_word": false,
633
+ "special": true
634
+ },
635
+ "128079": {
636
+ "content": "<|reserved_special_token_71|>",
637
+ "lstrip": false,
638
+ "normalized": false,
639
+ "rstrip": false,
640
+ "single_word": false,
641
+ "special": true
642
+ },
643
+ "128080": {
644
+ "content": "<|reserved_special_token_72|>",
645
+ "lstrip": false,
646
+ "normalized": false,
647
+ "rstrip": false,
648
+ "single_word": false,
649
+ "special": true
650
+ },
651
+ "128081": {
652
+ "content": "<|reserved_special_token_73|>",
653
+ "lstrip": false,
654
+ "normalized": false,
655
+ "rstrip": false,
656
+ "single_word": false,
657
+ "special": true
658
+ },
659
+ "128082": {
660
+ "content": "<|reserved_special_token_74|>",
661
+ "lstrip": false,
662
+ "normalized": false,
663
+ "rstrip": false,
664
+ "single_word": false,
665
+ "special": true
666
+ },
667
+ "128083": {
668
+ "content": "<|reserved_special_token_75|>",
669
+ "lstrip": false,
670
+ "normalized": false,
671
+ "rstrip": false,
672
+ "single_word": false,
673
+ "special": true
674
+ },
675
+ "128084": {
676
+ "content": "<|reserved_special_token_76|>",
677
+ "lstrip": false,
678
+ "normalized": false,
679
+ "rstrip": false,
680
+ "single_word": false,
681
+ "special": true
682
+ },
683
+ "128085": {
684
+ "content": "<|reserved_special_token_77|>",
685
+ "lstrip": false,
686
+ "normalized": false,
687
+ "rstrip": false,
688
+ "single_word": false,
689
+ "special": true
690
+ },
691
+ "128086": {
692
+ "content": "<|reserved_special_token_78|>",
693
+ "lstrip": false,
694
+ "normalized": false,
695
+ "rstrip": false,
696
+ "single_word": false,
697
+ "special": true
698
+ },
699
+ "128087": {
700
+ "content": "<|reserved_special_token_79|>",
701
+ "lstrip": false,
702
+ "normalized": false,
703
+ "rstrip": false,
704
+ "single_word": false,
705
+ "special": true
706
+ },
707
+ "128088": {
708
+ "content": "<|reserved_special_token_80|>",
709
+ "lstrip": false,
710
+ "normalized": false,
711
+ "rstrip": false,
712
+ "single_word": false,
713
+ "special": true
714
+ },
715
+ "128089": {
716
+ "content": "<|reserved_special_token_81|>",
717
+ "lstrip": false,
718
+ "normalized": false,
719
+ "rstrip": false,
720
+ "single_word": false,
721
+ "special": true
722
+ },
723
+ "128090": {
724
+ "content": "<|reserved_special_token_82|>",
725
+ "lstrip": false,
726
+ "normalized": false,
727
+ "rstrip": false,
728
+ "single_word": false,
729
+ "special": true
730
+ },
731
+ "128091": {
732
+ "content": "<|reserved_special_token_83|>",
733
+ "lstrip": false,
734
+ "normalized": false,
735
+ "rstrip": false,
736
+ "single_word": false,
737
+ "special": true
738
+ },
739
+ "128092": {
740
+ "content": "<|reserved_special_token_84|>",
741
+ "lstrip": false,
742
+ "normalized": false,
743
+ "rstrip": false,
744
+ "single_word": false,
745
+ "special": true
746
+ },
747
+ "128093": {
748
+ "content": "<|reserved_special_token_85|>",
749
+ "lstrip": false,
750
+ "normalized": false,
751
+ "rstrip": false,
752
+ "single_word": false,
753
+ "special": true
754
+ },
755
+ "128094": {
756
+ "content": "<|reserved_special_token_86|>",
757
+ "lstrip": false,
758
+ "normalized": false,
759
+ "rstrip": false,
760
+ "single_word": false,
761
+ "special": true
762
+ },
763
+ "128095": {
764
+ "content": "<|reserved_special_token_87|>",
765
+ "lstrip": false,
766
+ "normalized": false,
767
+ "rstrip": false,
768
+ "single_word": false,
769
+ "special": true
770
+ },
771
+ "128096": {
772
+ "content": "<|reserved_special_token_88|>",
773
+ "lstrip": false,
774
+ "normalized": false,
775
+ "rstrip": false,
776
+ "single_word": false,
777
+ "special": true
778
+ },
779
+ "128097": {
780
+ "content": "<|reserved_special_token_89|>",
781
+ "lstrip": false,
782
+ "normalized": false,
783
+ "rstrip": false,
784
+ "single_word": false,
785
+ "special": true
786
+ },
787
+ "128098": {
788
+ "content": "<|reserved_special_token_90|>",
789
+ "lstrip": false,
790
+ "normalized": false,
791
+ "rstrip": false,
792
+ "single_word": false,
793
+ "special": true
794
+ },
795
+ "128099": {
796
+ "content": "<|reserved_special_token_91|>",
797
+ "lstrip": false,
798
+ "normalized": false,
799
+ "rstrip": false,
800
+ "single_word": false,
801
+ "special": true
802
+ },
803
+ "128100": {
804
+ "content": "<|reserved_special_token_92|>",
805
+ "lstrip": false,
806
+ "normalized": false,
807
+ "rstrip": false,
808
+ "single_word": false,
809
+ "special": true
810
+ },
811
+ "128101": {
812
+ "content": "<|reserved_special_token_93|>",
813
+ "lstrip": false,
814
+ "normalized": false,
815
+ "rstrip": false,
816
+ "single_word": false,
817
+ "special": true
818
+ },
819
+ "128102": {
820
+ "content": "<|reserved_special_token_94|>",
821
+ "lstrip": false,
822
+ "normalized": false,
823
+ "rstrip": false,
824
+ "single_word": false,
825
+ "special": true
826
+ },
827
+ "128103": {
828
+ "content": "<|reserved_special_token_95|>",
829
+ "lstrip": false,
830
+ "normalized": false,
831
+ "rstrip": false,
832
+ "single_word": false,
833
+ "special": true
834
+ },
835
+ "128104": {
836
+ "content": "<|reserved_special_token_96|>",
837
+ "lstrip": false,
838
+ "normalized": false,
839
+ "rstrip": false,
840
+ "single_word": false,
841
+ "special": true
842
+ },
843
+ "128105": {
844
+ "content": "<|reserved_special_token_97|>",
845
+ "lstrip": false,
846
+ "normalized": false,
847
+ "rstrip": false,
848
+ "single_word": false,
849
+ "special": true
850
+ },
851
+ "128106": {
852
+ "content": "<|reserved_special_token_98|>",
853
+ "lstrip": false,
854
+ "normalized": false,
855
+ "rstrip": false,
856
+ "single_word": false,
857
+ "special": true
858
+ },
859
+ "128107": {
860
+ "content": "<|reserved_special_token_99|>",
861
+ "lstrip": false,
862
+ "normalized": false,
863
+ "rstrip": false,
864
+ "single_word": false,
865
+ "special": true
866
+ },
867
+ "128108": {
868
+ "content": "<|reserved_special_token_100|>",
869
+ "lstrip": false,
870
+ "normalized": false,
871
+ "rstrip": false,
872
+ "single_word": false,
873
+ "special": true
874
+ },
875
+ "128109": {
876
+ "content": "<|reserved_special_token_101|>",
877
+ "lstrip": false,
878
+ "normalized": false,
879
+ "rstrip": false,
880
+ "single_word": false,
881
+ "special": true
882
+ },
883
+ "128110": {
884
+ "content": "<|reserved_special_token_102|>",
885
+ "lstrip": false,
886
+ "normalized": false,
887
+ "rstrip": false,
888
+ "single_word": false,
889
+ "special": true
890
+ },
891
+ "128111": {
892
+ "content": "<|reserved_special_token_103|>",
893
+ "lstrip": false,
894
+ "normalized": false,
895
+ "rstrip": false,
896
+ "single_word": false,
897
+ "special": true
898
+ },
899
+ "128112": {
900
+ "content": "<|reserved_special_token_104|>",
901
+ "lstrip": false,
902
+ "normalized": false,
903
+ "rstrip": false,
904
+ "single_word": false,
905
+ "special": true
906
+ },
907
+ "128113": {
908
+ "content": "<|reserved_special_token_105|>",
909
+ "lstrip": false,
910
+ "normalized": false,
911
+ "rstrip": false,
912
+ "single_word": false,
913
+ "special": true
914
+ },
915
+ "128114": {
916
+ "content": "<|reserved_special_token_106|>",
917
+ "lstrip": false,
918
+ "normalized": false,
919
+ "rstrip": false,
920
+ "single_word": false,
921
+ "special": true
922
+ },
923
+ "128115": {
924
+ "content": "<|reserved_special_token_107|>",
925
+ "lstrip": false,
926
+ "normalized": false,
927
+ "rstrip": false,
928
+ "single_word": false,
929
+ "special": true
930
+ },
931
+ "128116": {
932
+ "content": "<|reserved_special_token_108|>",
933
+ "lstrip": false,
934
+ "normalized": false,
935
+ "rstrip": false,
936
+ "single_word": false,
937
+ "special": true
938
+ },
939
+ "128117": {
940
+ "content": "<|reserved_special_token_109|>",
941
+ "lstrip": false,
942
+ "normalized": false,
943
+ "rstrip": false,
944
+ "single_word": false,
945
+ "special": true
946
+ },
947
+ "128118": {
948
+ "content": "<|reserved_special_token_110|>",
949
+ "lstrip": false,
950
+ "normalized": false,
951
+ "rstrip": false,
952
+ "single_word": false,
953
+ "special": true
954
+ },
955
+ "128119": {
956
+ "content": "<|reserved_special_token_111|>",
957
+ "lstrip": false,
958
+ "normalized": false,
959
+ "rstrip": false,
960
+ "single_word": false,
961
+ "special": true
962
+ },
963
+ "128120": {
964
+ "content": "<|reserved_special_token_112|>",
965
+ "lstrip": false,
966
+ "normalized": false,
967
+ "rstrip": false,
968
+ "single_word": false,
969
+ "special": true
970
+ },
971
+ "128121": {
972
+ "content": "<|reserved_special_token_113|>",
973
+ "lstrip": false,
974
+ "normalized": false,
975
+ "rstrip": false,
976
+ "single_word": false,
977
+ "special": true
978
+ },
979
+ "128122": {
980
+ "content": "<|reserved_special_token_114|>",
981
+ "lstrip": false,
982
+ "normalized": false,
983
+ "rstrip": false,
984
+ "single_word": false,
985
+ "special": true
986
+ },
987
+ "128123": {
988
+ "content": "<|reserved_special_token_115|>",
989
+ "lstrip": false,
990
+ "normalized": false,
991
+ "rstrip": false,
992
+ "single_word": false,
993
+ "special": true
994
+ },
995
+ "128124": {
996
+ "content": "<|reserved_special_token_116|>",
997
+ "lstrip": false,
998
+ "normalized": false,
999
+ "rstrip": false,
1000
+ "single_word": false,
1001
+ "special": true
1002
+ },
1003
+ "128125": {
1004
+ "content": "<|reserved_special_token_117|>",
1005
+ "lstrip": false,
1006
+ "normalized": false,
1007
+ "rstrip": false,
1008
+ "single_word": false,
1009
+ "special": true
1010
+ },
1011
+ "128126": {
1012
+ "content": "<|reserved_special_token_118|>",
1013
+ "lstrip": false,
1014
+ "normalized": false,
1015
+ "rstrip": false,
1016
+ "single_word": false,
1017
+ "special": true
1018
+ },
1019
+ "128127": {
1020
+ "content": "<|reserved_special_token_119|>",
1021
+ "lstrip": false,
1022
+ "normalized": false,
1023
+ "rstrip": false,
1024
+ "single_word": false,
1025
+ "special": true
1026
+ },
1027
+ "128128": {
1028
+ "content": "<|reserved_special_token_120|>",
1029
+ "lstrip": false,
1030
+ "normalized": false,
1031
+ "rstrip": false,
1032
+ "single_word": false,
1033
+ "special": true
1034
+ },
1035
+ "128129": {
1036
+ "content": "<|reserved_special_token_121|>",
1037
+ "lstrip": false,
1038
+ "normalized": false,
1039
+ "rstrip": false,
1040
+ "single_word": false,
1041
+ "special": true
1042
+ },
1043
+ "128130": {
1044
+ "content": "<|reserved_special_token_122|>",
1045
+ "lstrip": false,
1046
+ "normalized": false,
1047
+ "rstrip": false,
1048
+ "single_word": false,
1049
+ "special": true
1050
+ },
1051
+ "128131": {
1052
+ "content": "<|reserved_special_token_123|>",
1053
+ "lstrip": false,
1054
+ "normalized": false,
1055
+ "rstrip": false,
1056
+ "single_word": false,
1057
+ "special": true
1058
+ },
1059
+ "128132": {
1060
+ "content": "<|reserved_special_token_124|>",
1061
+ "lstrip": false,
1062
+ "normalized": false,
1063
+ "rstrip": false,
1064
+ "single_word": false,
1065
+ "special": true
1066
+ },
1067
+ "128133": {
1068
+ "content": "<|reserved_special_token_125|>",
1069
+ "lstrip": false,
1070
+ "normalized": false,
1071
+ "rstrip": false,
1072
+ "single_word": false,
1073
+ "special": true
1074
+ },
1075
+ "128134": {
1076
+ "content": "<|reserved_special_token_126|>",
1077
+ "lstrip": false,
1078
+ "normalized": false,
1079
+ "rstrip": false,
1080
+ "single_word": false,
1081
+ "special": true
1082
+ },
1083
+ "128135": {
1084
+ "content": "<|reserved_special_token_127|>",
1085
+ "lstrip": false,
1086
+ "normalized": false,
1087
+ "rstrip": false,
1088
+ "single_word": false,
1089
+ "special": true
1090
+ },
1091
+ "128136": {
1092
+ "content": "<|reserved_special_token_128|>",
1093
+ "lstrip": false,
1094
+ "normalized": false,
1095
+ "rstrip": false,
1096
+ "single_word": false,
1097
+ "special": true
1098
+ },
1099
+ "128137": {
1100
+ "content": "<|reserved_special_token_129|>",
1101
+ "lstrip": false,
1102
+ "normalized": false,
1103
+ "rstrip": false,
1104
+ "single_word": false,
1105
+ "special": true
1106
+ },
1107
+ "128138": {
1108
+ "content": "<|reserved_special_token_130|>",
1109
+ "lstrip": false,
1110
+ "normalized": false,
1111
+ "rstrip": false,
1112
+ "single_word": false,
1113
+ "special": true
1114
+ },
1115
+ "128139": {
1116
+ "content": "<|reserved_special_token_131|>",
1117
+ "lstrip": false,
1118
+ "normalized": false,
1119
+ "rstrip": false,
1120
+ "single_word": false,
1121
+ "special": true
1122
+ },
1123
+ "128140": {
1124
+ "content": "<|reserved_special_token_132|>",
1125
+ "lstrip": false,
1126
+ "normalized": false,
1127
+ "rstrip": false,
1128
+ "single_word": false,
1129
+ "special": true
1130
+ },
1131
+ "128141": {
1132
+ "content": "<|reserved_special_token_133|>",
1133
+ "lstrip": false,
1134
+ "normalized": false,
1135
+ "rstrip": false,
1136
+ "single_word": false,
1137
+ "special": true
1138
+ },
1139
+ "128142": {
1140
+ "content": "<|reserved_special_token_134|>",
1141
+ "lstrip": false,
1142
+ "normalized": false,
1143
+ "rstrip": false,
1144
+ "single_word": false,
1145
+ "special": true
1146
+ },
1147
+ "128143": {
1148
+ "content": "<|reserved_special_token_135|>",
1149
+ "lstrip": false,
1150
+ "normalized": false,
1151
+ "rstrip": false,
1152
+ "single_word": false,
1153
+ "special": true
1154
+ },
1155
+ "128144": {
1156
+ "content": "<|reserved_special_token_136|>",
1157
+ "lstrip": false,
1158
+ "normalized": false,
1159
+ "rstrip": false,
1160
+ "single_word": false,
1161
+ "special": true
1162
+ },
1163
+ "128145": {
1164
+ "content": "<|reserved_special_token_137|>",
1165
+ "lstrip": false,
1166
+ "normalized": false,
1167
+ "rstrip": false,
1168
+ "single_word": false,
1169
+ "special": true
1170
+ },
1171
+ "128146": {
1172
+ "content": "<|reserved_special_token_138|>",
1173
+ "lstrip": false,
1174
+ "normalized": false,
1175
+ "rstrip": false,
1176
+ "single_word": false,
1177
+ "special": true
1178
+ },
1179
+ "128147": {
1180
+ "content": "<|reserved_special_token_139|>",
1181
+ "lstrip": false,
1182
+ "normalized": false,
1183
+ "rstrip": false,
1184
+ "single_word": false,
1185
+ "special": true
1186
+ },
1187
+ "128148": {
1188
+ "content": "<|reserved_special_token_140|>",
1189
+ "lstrip": false,
1190
+ "normalized": false,
1191
+ "rstrip": false,
1192
+ "single_word": false,
1193
+ "special": true
1194
+ },
1195
+ "128149": {
1196
+ "content": "<|reserved_special_token_141|>",
1197
+ "lstrip": false,
1198
+ "normalized": false,
1199
+ "rstrip": false,
1200
+ "single_word": false,
1201
+ "special": true
1202
+ },
1203
+ "128150": {
1204
+ "content": "<|reserved_special_token_142|>",
1205
+ "lstrip": false,
1206
+ "normalized": false,
1207
+ "rstrip": false,
1208
+ "single_word": false,
1209
+ "special": true
1210
+ },
1211
+ "128151": {
1212
+ "content": "<|reserved_special_token_143|>",
1213
+ "lstrip": false,
1214
+ "normalized": false,
1215
+ "rstrip": false,
1216
+ "single_word": false,
1217
+ "special": true
1218
+ },
1219
+ "128152": {
1220
+ "content": "<|reserved_special_token_144|>",
1221
+ "lstrip": false,
1222
+ "normalized": false,
1223
+ "rstrip": false,
1224
+ "single_word": false,
1225
+ "special": true
1226
+ },
1227
+ "128153": {
1228
+ "content": "<|reserved_special_token_145|>",
1229
+ "lstrip": false,
1230
+ "normalized": false,
1231
+ "rstrip": false,
1232
+ "single_word": false,
1233
+ "special": true
1234
+ },
1235
+ "128154": {
1236
+ "content": "<|reserved_special_token_146|>",
1237
+ "lstrip": false,
1238
+ "normalized": false,
1239
+ "rstrip": false,
1240
+ "single_word": false,
1241
+ "special": true
1242
+ },
1243
+ "128155": {
1244
+ "content": "<|reserved_special_token_147|>",
1245
+ "lstrip": false,
1246
+ "normalized": false,
1247
+ "rstrip": false,
1248
+ "single_word": false,
1249
+ "special": true
1250
+ },
1251
+ "128156": {
1252
+ "content": "<|reserved_special_token_148|>",
1253
+ "lstrip": false,
1254
+ "normalized": false,
1255
+ "rstrip": false,
1256
+ "single_word": false,
1257
+ "special": true
1258
+ },
1259
+ "128157": {
1260
+ "content": "<|reserved_special_token_149|>",
1261
+ "lstrip": false,
1262
+ "normalized": false,
1263
+ "rstrip": false,
1264
+ "single_word": false,
1265
+ "special": true
1266
+ },
1267
+ "128158": {
1268
+ "content": "<|reserved_special_token_150|>",
1269
+ "lstrip": false,
1270
+ "normalized": false,
1271
+ "rstrip": false,
1272
+ "single_word": false,
1273
+ "special": true
1274
+ },
1275
+ "128159": {
1276
+ "content": "<|reserved_special_token_151|>",
1277
+ "lstrip": false,
1278
+ "normalized": false,
1279
+ "rstrip": false,
1280
+ "single_word": false,
1281
+ "special": true
1282
+ },
1283
+ "128160": {
1284
+ "content": "<|reserved_special_token_152|>",
1285
+ "lstrip": false,
1286
+ "normalized": false,
1287
+ "rstrip": false,
1288
+ "single_word": false,
1289
+ "special": true
1290
+ },
1291
+ "128161": {
1292
+ "content": "<|reserved_special_token_153|>",
1293
+ "lstrip": false,
1294
+ "normalized": false,
1295
+ "rstrip": false,
1296
+ "single_word": false,
1297
+ "special": true
1298
+ },
1299
+ "128162": {
1300
+ "content": "<|reserved_special_token_154|>",
1301
+ "lstrip": false,
1302
+ "normalized": false,
1303
+ "rstrip": false,
1304
+ "single_word": false,
1305
+ "special": true
1306
+ },
1307
+ "128163": {
1308
+ "content": "<|reserved_special_token_155|>",
1309
+ "lstrip": false,
1310
+ "normalized": false,
1311
+ "rstrip": false,
1312
+ "single_word": false,
1313
+ "special": true
1314
+ },
1315
+ "128164": {
1316
+ "content": "<|reserved_special_token_156|>",
1317
+ "lstrip": false,
1318
+ "normalized": false,
1319
+ "rstrip": false,
1320
+ "single_word": false,
1321
+ "special": true
1322
+ },
1323
+ "128165": {
1324
+ "content": "<|reserved_special_token_157|>",
1325
+ "lstrip": false,
1326
+ "normalized": false,
1327
+ "rstrip": false,
1328
+ "single_word": false,
1329
+ "special": true
1330
+ },
1331
+ "128166": {
1332
+ "content": "<|reserved_special_token_158|>",
1333
+ "lstrip": false,
1334
+ "normalized": false,
1335
+ "rstrip": false,
1336
+ "single_word": false,
1337
+ "special": true
1338
+ },
1339
+ "128167": {
1340
+ "content": "<|reserved_special_token_159|>",
1341
+ "lstrip": false,
1342
+ "normalized": false,
1343
+ "rstrip": false,
1344
+ "single_word": false,
1345
+ "special": true
1346
+ },
1347
+ "128168": {
1348
+ "content": "<|reserved_special_token_160|>",
1349
+ "lstrip": false,
1350
+ "normalized": false,
1351
+ "rstrip": false,
1352
+ "single_word": false,
1353
+ "special": true
1354
+ },
1355
+ "128169": {
1356
+ "content": "<|reserved_special_token_161|>",
1357
+ "lstrip": false,
1358
+ "normalized": false,
1359
+ "rstrip": false,
1360
+ "single_word": false,
1361
+ "special": true
1362
+ },
1363
+ "128170": {
1364
+ "content": "<|reserved_special_token_162|>",
1365
+ "lstrip": false,
1366
+ "normalized": false,
1367
+ "rstrip": false,
1368
+ "single_word": false,
1369
+ "special": true
1370
+ },
1371
+ "128171": {
1372
+ "content": "<|reserved_special_token_163|>",
1373
+ "lstrip": false,
1374
+ "normalized": false,
1375
+ "rstrip": false,
1376
+ "single_word": false,
1377
+ "special": true
1378
+ },
1379
+ "128172": {
1380
+ "content": "<|reserved_special_token_164|>",
1381
+ "lstrip": false,
1382
+ "normalized": false,
1383
+ "rstrip": false,
1384
+ "single_word": false,
1385
+ "special": true
1386
+ },
1387
+ "128173": {
1388
+ "content": "<|reserved_special_token_165|>",
1389
+ "lstrip": false,
1390
+ "normalized": false,
1391
+ "rstrip": false,
1392
+ "single_word": false,
1393
+ "special": true
1394
+ },
1395
+ "128174": {
1396
+ "content": "<|reserved_special_token_166|>",
1397
+ "lstrip": false,
1398
+ "normalized": false,
1399
+ "rstrip": false,
1400
+ "single_word": false,
1401
+ "special": true
1402
+ },
1403
+ "128175": {
1404
+ "content": "<|reserved_special_token_167|>",
1405
+ "lstrip": false,
1406
+ "normalized": false,
1407
+ "rstrip": false,
1408
+ "single_word": false,
1409
+ "special": true
1410
+ },
1411
+ "128176": {
1412
+ "content": "<|reserved_special_token_168|>",
1413
+ "lstrip": false,
1414
+ "normalized": false,
1415
+ "rstrip": false,
1416
+ "single_word": false,
1417
+ "special": true
1418
+ },
1419
+ "128177": {
1420
+ "content": "<|reserved_special_token_169|>",
1421
+ "lstrip": false,
1422
+ "normalized": false,
1423
+ "rstrip": false,
1424
+ "single_word": false,
1425
+ "special": true
1426
+ },
1427
+ "128178": {
1428
+ "content": "<|reserved_special_token_170|>",
1429
+ "lstrip": false,
1430
+ "normalized": false,
1431
+ "rstrip": false,
1432
+ "single_word": false,
1433
+ "special": true
1434
+ },
1435
+ "128179": {
1436
+ "content": "<|reserved_special_token_171|>",
1437
+ "lstrip": false,
1438
+ "normalized": false,
1439
+ "rstrip": false,
1440
+ "single_word": false,
1441
+ "special": true
1442
+ },
1443
+ "128180": {
1444
+ "content": "<|reserved_special_token_172|>",
1445
+ "lstrip": false,
1446
+ "normalized": false,
1447
+ "rstrip": false,
1448
+ "single_word": false,
1449
+ "special": true
1450
+ },
1451
+ "128181": {
1452
+ "content": "<|reserved_special_token_173|>",
1453
+ "lstrip": false,
1454
+ "normalized": false,
1455
+ "rstrip": false,
1456
+ "single_word": false,
1457
+ "special": true
1458
+ },
1459
+ "128182": {
1460
+ "content": "<|reserved_special_token_174|>",
1461
+ "lstrip": false,
1462
+ "normalized": false,
1463
+ "rstrip": false,
1464
+ "single_word": false,
1465
+ "special": true
1466
+ },
1467
+ "128183": {
1468
+ "content": "<|reserved_special_token_175|>",
1469
+ "lstrip": false,
1470
+ "normalized": false,
1471
+ "rstrip": false,
1472
+ "single_word": false,
1473
+ "special": true
1474
+ },
1475
+ "128184": {
1476
+ "content": "<|reserved_special_token_176|>",
1477
+ "lstrip": false,
1478
+ "normalized": false,
1479
+ "rstrip": false,
1480
+ "single_word": false,
1481
+ "special": true
1482
+ },
1483
+ "128185": {
1484
+ "content": "<|reserved_special_token_177|>",
1485
+ "lstrip": false,
1486
+ "normalized": false,
1487
+ "rstrip": false,
1488
+ "single_word": false,
1489
+ "special": true
1490
+ },
1491
+ "128186": {
1492
+ "content": "<|reserved_special_token_178|>",
1493
+ "lstrip": false,
1494
+ "normalized": false,
1495
+ "rstrip": false,
1496
+ "single_word": false,
1497
+ "special": true
1498
+ },
1499
+ "128187": {
1500
+ "content": "<|reserved_special_token_179|>",
1501
+ "lstrip": false,
1502
+ "normalized": false,
1503
+ "rstrip": false,
1504
+ "single_word": false,
1505
+ "special": true
1506
+ },
1507
+ "128188": {
1508
+ "content": "<|reserved_special_token_180|>",
1509
+ "lstrip": false,
1510
+ "normalized": false,
1511
+ "rstrip": false,
1512
+ "single_word": false,
1513
+ "special": true
1514
+ },
1515
+ "128189": {
1516
+ "content": "<|reserved_special_token_181|>",
1517
+ "lstrip": false,
1518
+ "normalized": false,
1519
+ "rstrip": false,
1520
+ "single_word": false,
1521
+ "special": true
1522
+ },
1523
+ "128190": {
1524
+ "content": "<|reserved_special_token_182|>",
1525
+ "lstrip": false,
1526
+ "normalized": false,
1527
+ "rstrip": false,
1528
+ "single_word": false,
1529
+ "special": true
1530
+ },
1531
+ "128191": {
1532
+ "content": "<|reserved_special_token_183|>",
1533
+ "lstrip": false,
1534
+ "normalized": false,
1535
+ "rstrip": false,
1536
+ "single_word": false,
1537
+ "special": true
1538
+ },
1539
+ "128192": {
1540
+ "content": "<|reserved_special_token_184|>",
1541
+ "lstrip": false,
1542
+ "normalized": false,
1543
+ "rstrip": false,
1544
+ "single_word": false,
1545
+ "special": true
1546
+ },
1547
+ "128193": {
1548
+ "content": "<|reserved_special_token_185|>",
1549
+ "lstrip": false,
1550
+ "normalized": false,
1551
+ "rstrip": false,
1552
+ "single_word": false,
1553
+ "special": true
1554
+ },
1555
+ "128194": {
1556
+ "content": "<|reserved_special_token_186|>",
1557
+ "lstrip": false,
1558
+ "normalized": false,
1559
+ "rstrip": false,
1560
+ "single_word": false,
1561
+ "special": true
1562
+ },
1563
+ "128195": {
1564
+ "content": "<|reserved_special_token_187|>",
1565
+ "lstrip": false,
1566
+ "normalized": false,
1567
+ "rstrip": false,
1568
+ "single_word": false,
1569
+ "special": true
1570
+ },
1571
+ "128196": {
1572
+ "content": "<|reserved_special_token_188|>",
1573
+ "lstrip": false,
1574
+ "normalized": false,
1575
+ "rstrip": false,
1576
+ "single_word": false,
1577
+ "special": true
1578
+ },
1579
+ "128197": {
1580
+ "content": "<|reserved_special_token_189|>",
1581
+ "lstrip": false,
1582
+ "normalized": false,
1583
+ "rstrip": false,
1584
+ "single_word": false,
1585
+ "special": true
1586
+ },
1587
+ "128198": {
1588
+ "content": "<|reserved_special_token_190|>",
1589
+ "lstrip": false,
1590
+ "normalized": false,
1591
+ "rstrip": false,
1592
+ "single_word": false,
1593
+ "special": true
1594
+ },
1595
+ "128199": {
1596
+ "content": "<|reserved_special_token_191|>",
1597
+ "lstrip": false,
1598
+ "normalized": false,
1599
+ "rstrip": false,
1600
+ "single_word": false,
1601
+ "special": true
1602
+ },
1603
+ "128200": {
1604
+ "content": "<|reserved_special_token_192|>",
1605
+ "lstrip": false,
1606
+ "normalized": false,
1607
+ "rstrip": false,
1608
+ "single_word": false,
1609
+ "special": true
1610
+ },
1611
+ "128201": {
1612
+ "content": "<|reserved_special_token_193|>",
1613
+ "lstrip": false,
1614
+ "normalized": false,
1615
+ "rstrip": false,
1616
+ "single_word": false,
1617
+ "special": true
1618
+ },
1619
+ "128202": {
1620
+ "content": "<|reserved_special_token_194|>",
1621
+ "lstrip": false,
1622
+ "normalized": false,
1623
+ "rstrip": false,
1624
+ "single_word": false,
1625
+ "special": true
1626
+ },
1627
+ "128203": {
1628
+ "content": "<|reserved_special_token_195|>",
1629
+ "lstrip": false,
1630
+ "normalized": false,
1631
+ "rstrip": false,
1632
+ "single_word": false,
1633
+ "special": true
1634
+ },
1635
+ "128204": {
1636
+ "content": "<|reserved_special_token_196|>",
1637
+ "lstrip": false,
1638
+ "normalized": false,
1639
+ "rstrip": false,
1640
+ "single_word": false,
1641
+ "special": true
1642
+ },
1643
+ "128205": {
1644
+ "content": "<|reserved_special_token_197|>",
1645
+ "lstrip": false,
1646
+ "normalized": false,
1647
+ "rstrip": false,
1648
+ "single_word": false,
1649
+ "special": true
1650
+ },
1651
+ "128206": {
1652
+ "content": "<|reserved_special_token_198|>",
1653
+ "lstrip": false,
1654
+ "normalized": false,
1655
+ "rstrip": false,
1656
+ "single_word": false,
1657
+ "special": true
1658
+ },
1659
+ "128207": {
1660
+ "content": "<|reserved_special_token_199|>",
1661
+ "lstrip": false,
1662
+ "normalized": false,
1663
+ "rstrip": false,
1664
+ "single_word": false,
1665
+ "special": true
1666
+ },
1667
+ "128208": {
1668
+ "content": "<|reserved_special_token_200|>",
1669
+ "lstrip": false,
1670
+ "normalized": false,
1671
+ "rstrip": false,
1672
+ "single_word": false,
1673
+ "special": true
1674
+ },
1675
+ "128209": {
1676
+ "content": "<|reserved_special_token_201|>",
1677
+ "lstrip": false,
1678
+ "normalized": false,
1679
+ "rstrip": false,
1680
+ "single_word": false,
1681
+ "special": true
1682
+ },
1683
+ "128210": {
1684
+ "content": "<|reserved_special_token_202|>",
1685
+ "lstrip": false,
1686
+ "normalized": false,
1687
+ "rstrip": false,
1688
+ "single_word": false,
1689
+ "special": true
1690
+ },
1691
+ "128211": {
1692
+ "content": "<|reserved_special_token_203|>",
1693
+ "lstrip": false,
1694
+ "normalized": false,
1695
+ "rstrip": false,
1696
+ "single_word": false,
1697
+ "special": true
1698
+ },
1699
+ "128212": {
1700
+ "content": "<|reserved_special_token_204|>",
1701
+ "lstrip": false,
1702
+ "normalized": false,
1703
+ "rstrip": false,
1704
+ "single_word": false,
1705
+ "special": true
1706
+ },
1707
+ "128213": {
1708
+ "content": "<|reserved_special_token_205|>",
1709
+ "lstrip": false,
1710
+ "normalized": false,
1711
+ "rstrip": false,
1712
+ "single_word": false,
1713
+ "special": true
1714
+ },
1715
+ "128214": {
1716
+ "content": "<|reserved_special_token_206|>",
1717
+ "lstrip": false,
1718
+ "normalized": false,
1719
+ "rstrip": false,
1720
+ "single_word": false,
1721
+ "special": true
1722
+ },
1723
+ "128215": {
1724
+ "content": "<|reserved_special_token_207|>",
1725
+ "lstrip": false,
1726
+ "normalized": false,
1727
+ "rstrip": false,
1728
+ "single_word": false,
1729
+ "special": true
1730
+ },
1731
+ "128216": {
1732
+ "content": "<|reserved_special_token_208|>",
1733
+ "lstrip": false,
1734
+ "normalized": false,
1735
+ "rstrip": false,
1736
+ "single_word": false,
1737
+ "special": true
1738
+ },
1739
+ "128217": {
1740
+ "content": "<|reserved_special_token_209|>",
1741
+ "lstrip": false,
1742
+ "normalized": false,
1743
+ "rstrip": false,
1744
+ "single_word": false,
1745
+ "special": true
1746
+ },
1747
+ "128218": {
1748
+ "content": "<|reserved_special_token_210|>",
1749
+ "lstrip": false,
1750
+ "normalized": false,
1751
+ "rstrip": false,
1752
+ "single_word": false,
1753
+ "special": true
1754
+ },
1755
+ "128219": {
1756
+ "content": "<|reserved_special_token_211|>",
1757
+ "lstrip": false,
1758
+ "normalized": false,
1759
+ "rstrip": false,
1760
+ "single_word": false,
1761
+ "special": true
1762
+ },
1763
+ "128220": {
1764
+ "content": "<|reserved_special_token_212|>",
1765
+ "lstrip": false,
1766
+ "normalized": false,
1767
+ "rstrip": false,
1768
+ "single_word": false,
1769
+ "special": true
1770
+ },
1771
+ "128221": {
1772
+ "content": "<|reserved_special_token_213|>",
1773
+ "lstrip": false,
1774
+ "normalized": false,
1775
+ "rstrip": false,
1776
+ "single_word": false,
1777
+ "special": true
1778
+ },
1779
+ "128222": {
1780
+ "content": "<|reserved_special_token_214|>",
1781
+ "lstrip": false,
1782
+ "normalized": false,
1783
+ "rstrip": false,
1784
+ "single_word": false,
1785
+ "special": true
1786
+ },
1787
+ "128223": {
1788
+ "content": "<|reserved_special_token_215|>",
1789
+ "lstrip": false,
1790
+ "normalized": false,
1791
+ "rstrip": false,
1792
+ "single_word": false,
1793
+ "special": true
1794
+ },
1795
+ "128224": {
1796
+ "content": "<|reserved_special_token_216|>",
1797
+ "lstrip": false,
1798
+ "normalized": false,
1799
+ "rstrip": false,
1800
+ "single_word": false,
1801
+ "special": true
1802
+ },
1803
+ "128225": {
1804
+ "content": "<|reserved_special_token_217|>",
1805
+ "lstrip": false,
1806
+ "normalized": false,
1807
+ "rstrip": false,
1808
+ "single_word": false,
1809
+ "special": true
1810
+ },
1811
+ "128226": {
1812
+ "content": "<|reserved_special_token_218|>",
1813
+ "lstrip": false,
1814
+ "normalized": false,
1815
+ "rstrip": false,
1816
+ "single_word": false,
1817
+ "special": true
1818
+ },
1819
+ "128227": {
1820
+ "content": "<think>",
1821
+ "lstrip": false,
1822
+ "normalized": false,
1823
+ "rstrip": false,
1824
+ "single_word": false,
1825
+ "special": false
1826
+ },
1827
+ "128228": {
1828
+ "content": "</think>",
1829
+ "lstrip": false,
1830
+ "normalized": false,
1831
+ "rstrip": false,
1832
+ "single_word": false,
1833
+ "special": false
1834
+ },
1835
+ "128229": {
1836
+ "content": "<answer>",
1837
+ "lstrip": false,
1838
+ "normalized": false,
1839
+ "rstrip": false,
1840
+ "single_word": false,
1841
+ "special": false
1842
+ },
1843
+ "128230": {
1844
+ "content": "</answer>",
1845
+ "lstrip": false,
1846
+ "normalized": false,
1847
+ "rstrip": false,
1848
+ "single_word": false,
1849
+ "special": false
1850
+ },
1851
+ "128231": {
1852
+ "content": "<|search_begin|>",
1853
+ "lstrip": false,
1854
+ "normalized": false,
1855
+ "rstrip": false,
1856
+ "single_word": false,
1857
+ "special": false
1858
+ },
1859
+ "128232": {
1860
+ "content": "<|search_end|>",
1861
+ "lstrip": false,
1862
+ "normalized": false,
1863
+ "rstrip": false,
1864
+ "single_word": false,
1865
+ "special": false
1866
+ },
1867
+ "128233": {
1868
+ "content": "<|fim_pad|>",
1869
+ "lstrip": false,
1870
+ "normalized": false,
1871
+ "rstrip": false,
1872
+ "single_word": false,
1873
+ "special": false
1874
+ },
1875
+ "128234": {
1876
+ "content": "<|repo_name|>",
1877
+ "lstrip": false,
1878
+ "normalized": false,
1879
+ "rstrip": false,
1880
+ "single_word": false,
1881
+ "special": false
1882
+ },
1883
+ "128235": {
1884
+ "content": "<|file_sep|>",
1885
+ "lstrip": false,
1886
+ "normalized": false,
1887
+ "rstrip": false,
1888
+ "single_word": false,
1889
+ "special": false
1890
+ },
1891
+ "128236": {
1892
+ "content": "<|User|>",
1893
+ "lstrip": false,
1894
+ "normalized": false,
1895
+ "rstrip": false,
1896
+ "single_word": false,
1897
+ "special": false
1898
+ },
1899
+ "128237": {
1900
+ "content": "<|Assistant|>",
1901
+ "lstrip": false,
1902
+ "normalized": false,
1903
+ "rstrip": false,
1904
+ "single_word": false,
1905
+ "special": false
1906
+ },
1907
+ "128238": {
1908
+ "content": "<|EOT|>",
1909
+ "lstrip": false,
1910
+ "normalized": false,
1911
+ "rstrip": false,
1912
+ "single_word": false,
1913
+ "special": false
1914
+ },
1915
+ "128239": {
1916
+ "content": "<|begin_of_tool_description|>",
1917
+ "lstrip": false,
1918
+ "normalized": false,
1919
+ "rstrip": false,
1920
+ "single_word": false,
1921
+ "special": false
1922
+ },
1923
+ "128240": {
1924
+ "content": "<|end_of_tool_description|>",
1925
+ "lstrip": false,
1926
+ "normalized": false,
1927
+ "rstrip": false,
1928
+ "single_word": false,
1929
+ "special": false
1930
+ },
1931
+ "128241": {
1932
+ "content": "<tools>",
1933
+ "lstrip": false,
1934
+ "normalized": false,
1935
+ "rstrip": false,
1936
+ "single_word": false,
1937
+ "special": false
1938
+ },
1939
+ "128242": {
1940
+ "content": "</tools>",
1941
+ "lstrip": false,
1942
+ "normalized": false,
1943
+ "rstrip": false,
1944
+ "single_word": false,
1945
+ "special": false
1946
+ },
1947
+ "128243": {
1948
+ "content": "<|tool_calls_begin|>",
1949
+ "lstrip": false,
1950
+ "normalized": false,
1951
+ "rstrip": false,
1952
+ "single_word": false,
1953
+ "special": false
1954
+ },
1955
+ "128244": {
1956
+ "content": "<|tool_calls_end|>",
1957
+ "lstrip": false,
1958
+ "normalized": false,
1959
+ "rstrip": false,
1960
+ "single_word": false,
1961
+ "special": false
1962
+ },
1963
+ "128245": {
1964
+ "content": "<|tool_call_begin|>",
1965
+ "lstrip": false,
1966
+ "normalized": false,
1967
+ "rstrip": false,
1968
+ "single_word": false,
1969
+ "special": false
1970
+ },
1971
+ "128246": {
1972
+ "content": "<|tool_call_end|>",
1973
+ "lstrip": false,
1974
+ "normalized": false,
1975
+ "rstrip": false,
1976
+ "single_word": false,
1977
+ "special": false
1978
+ },
1979
+ "128247": {
1980
+ "content": "<tool_call>",
1981
+ "lstrip": false,
1982
+ "normalized": false,
1983
+ "rstrip": false,
1984
+ "single_word": false,
1985
+ "special": false
1986
+ },
1987
+ "128248": {
1988
+ "content": "</tool_call>",
1989
+ "lstrip": false,
1990
+ "normalized": false,
1991
+ "rstrip": false,
1992
+ "single_word": false,
1993
+ "special": false
1994
+ },
1995
+ "128249": {
1996
+ "content": "<|tool_outputs_begin|>",
1997
+ "lstrip": false,
1998
+ "normalized": false,
1999
+ "rstrip": false,
2000
+ "single_word": false,
2001
+ "special": false
2002
+ },
2003
+ "128250": {
2004
+ "content": "<|tool_outputs_end|>",
2005
+ "lstrip": false,
2006
+ "normalized": false,
2007
+ "rstrip": false,
2008
+ "single_word": false,
2009
+ "special": false
2010
+ },
2011
+ "128251": {
2012
+ "content": "<|tool_output_begin|>",
2013
+ "lstrip": false,
2014
+ "normalized": false,
2015
+ "rstrip": false,
2016
+ "single_word": false,
2017
+ "special": false
2018
+ },
2019
+ "128252": {
2020
+ "content": "<|tool_output_end|>",
2021
+ "lstrip": false,
2022
+ "normalized": false,
2023
+ "rstrip": false,
2024
+ "single_word": false,
2025
+ "special": false
2026
+ },
2027
+ "128253": {
2028
+ "content": "<tool_response>",
2029
+ "lstrip": false,
2030
+ "normalized": false,
2031
+ "rstrip": false,
2032
+ "single_word": false,
2033
+ "special": false
2034
+ },
2035
+ "128254": {
2036
+ "content": "</tool_response>",
2037
+ "lstrip": false,
2038
+ "normalized": false,
2039
+ "rstrip": false,
2040
+ "single_word": false,
2041
+ "special": false
2042
+ },
2043
+ "128255": {
2044
+ "content": "<|tool_sep|>",
2045
+ "lstrip": false,
2046
+ "normalized": false,
2047
+ "rstrip": false,
2048
+ "single_word": false,
2049
+ "special": false
2050
+ }
2051
+ },
2052
+ "bos_token": "<|begin_of_text|>",
2053
+ "clean_up_tokenization_spaces": false,
2054
+ "eos_token": "<|end_of_text|>",
2055
+ "extra_special_tokens": {},
2056
+ "model_input_names": [
2057
+ "input_ids",
2058
+ "attention_mask"
2059
+ ],
2060
+ "model_max_length": 131072,
2061
+ "pad_token": "<|end_of_text|>",
2062
+ "tokenizer_class": "PreTrainedTokenizerFast",
2063
+ "truncation_side": "left"
2064
+ }
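
Note: the stanza above fixes the tokenizer's runtime behavior (bos/eos/pad tokens, 131072-token context, left-side truncation, fast-tokenizer class). A minimal sketch of how these settings surface when the files in this commit are loaded with Hugging Face transformers follows; the local path "./Youtu-LLM-2B" is an assumption for illustration and stands in for any checkout of this repository.

from transformers import AutoTokenizer

# Load the PreTrainedTokenizerFast declared in tokenizer_config.json.
# "./Youtu-LLM-2B" is a placeholder path to a local clone of this repo.
tok = AutoTokenizer.from_pretrained("./Youtu-LLM-2B")

print(tok.bos_token)         # <|begin_of_text|>
print(tok.eos_token)         # <|end_of_text|>, also configured as pad_token
print(tok.model_max_length)  # 131072

# Markers such as <think>, <answer> and <tool_call> are registered in
# added_tokens_decoder with "special": false: they encode to single token
# ids, but decode(..., skip_special_tokens=True) leaves them in the text,
# unlike the "special": true reserved tokens, which are stripped.
ids = tok.encode("<think>2+2=4</think><answer>4</answer>")
print(tok.decode(ids, skip_special_tokens=True))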