Commit f5c6e80

hiyouga and Salmon-f42 authored and committed
[assets] update video (hiyouga#7287)

This squashed commit also includes:

- [assets] update wechat (hiyouga#7288)
- [dataset] fix ultrachat_200k dataset (hiyouga#7259): the `HuggingFaceH4/ultrachat_200k` dataset doesn't contain the default "train" split; the correct split is "train_sft".
- [data] gemma3 plugin pan and scan (hiyouga#7294): add pan-and-scan support, add a test case, fix the test.
- [inference] support sglang backend (hiyouga#7278): mimic the SGLang offline Engine, add more tests and args, fix `sample_params`, fix stream chat, change SGLang from engine mode to server mode, use SGLang built-in utilities, fix docs, fix the sglang engine, add a readme. Co-authored-by: Jin Pan, hiyouga.
- [model] support hunyuan 7b (hiyouga#7317): support the tencent-hunyuan model, with follow-up fixes.
- [assets] update videos (hiyouga#7340): update README.md and README_zh.md.
- [data] fix template (hiyouga#7349)
- [misc] set dev version (hiyouga#7351)
- [assets] update wechat (hiyouga#7361)
- [version] fix minicpmo (hiyouga#7378)
- [3rdparty] fix redundant process group destroy for ray (hiyouga#7395). Co-authored-by: hoshi-hiyouga.
- [misc] fix sglang deps (hiyouga#7432): add a transformers version requirement for sglang, and add the `srt` extra required to run sglang; other options are `srt_hip`, `srt_xpu`, `srt_npu`, `srt_hpu` and `srt_cpu` for different compute architectures.
- [deps] upgrade vllm to 0.8 (hiyouga#7436)
- [deps] upgrade transformers to 4.50.0 (hiyouga#7437): upgrade transformers, fix the hf cache, fix the dpo trainer.
- [scripts] support computing scores on vllm's predictions (hiyouga#7419): enable manual BLEU/ROUGE evaluation by adding `scripts/eval_bleu_rouge.py`, add library checks, use the datasets library's multiprocessing to speed up processing, switch to `fire.Fire` and delete the `sys.argv` handling. Co-authored-by: SnowFox4004, hoshi-hiyouga.
- [misc] fix license (hiyouga#7440)
- [misc] fix ci (hiyouga#7441): fix and improve ci.
- [docker] upgrade to torch 2.6 (hiyouga#7442)
- [trainer] fix vlm loss for transformers 4.49 (hiyouga#7448)
- [assets] fix gemma3 readme (hiyouga#7449)
- [assets] update wechat (hiyouga#7455)
- [misc] enable liger kernel for gemma3 (hiyouga#7462)
- [misc] enable liger kernel for gemma3 text and paligemma (1, 2 and 2-mix) (hiyouga#7466)
- [misc] update liger-kernel's monkey patch (hiyouga#7453): update liger_kernel.py and setup.py.
- [model] fix lora on quantized models (hiyouga#7456)
- [model] add qwen2vl 32b & upgrade peft to 0.15 (hiyouga#7469)
- [trainer] fix wsd scheduler (hiyouga#7304): warmup_stable_decay now supports setting the numbers of stable and decay steps according to the warmup_ratio. Co-authored-by: hoshi-hiyouga.
- [3rdparty] support swanlab lark notification (hiyouga#7481)
- [data] fix pixtral plugin (hiyouga#7505): preserve `image_sizes`, add comments.
- [assets] update wechat (hiyouga#7523)
- [deps] pin pydantic to 2.10.6 (hiyouga#7546)
- [model] add Qwen2.5-Omni model (hiyouga#7537): preserve image_sizes, add the plugin, support audio-text2text and image/video-text2text LoRA, add docs, add a merge script, add license.
- [data] fix qwen2.5 omni collator (hiyouga#7553)
- [trainer] new kto mismatch pair creation strategy (hiyouga#7509)
- [data] shard the dataset to allow multiprocessing when streaming is enabled (hiyouga#7530): shard the dataset when streaming, and allow users to leave `dataset_shards` unset for backward compatibility.
- [webui] fix launch with proxy (hiyouga#7332)
- [data] specify position_ids in PackedSupervisedDatasetProcessor for neat_packing (hiyouga#7318): use position_ids for neat_packing with fa2, then revert the fa2 changes.
- [model] fix use_cache patching for gemma3 multimodal (hiyouga#7500)
- [model] fix kv cache (hiyouga#7564)
- [infer] vllm video/audio inference (hiyouga#7566)
- [trainer] fix batch processing in PPO trainer (hiyouga#7576)
- [data] fix qwen2.5 omni plugin (hiyouga#7573): align keys with qwen2vl, adjust scripts.
- [data] fix qwen2.5 omni plugin (hiyouga#7578): fix the fps calculation. Co-authored-by: hoshi-hiyouga.
- [assets] update wechat (hiyouga#7594)
- [model] add llama4 (hiyouga#7611)
- [assets] update readme (hiyouga#7612)
- [misc] fix packing and eval plot (hiyouga#7623)
- [sglang] support transformers 4.51.0 (hiyouga#7639)
- [trainer] fix key error (hiyouga#7635)
- [data] fix bugs of `use_audio_in_video` in Qwen2.5 Omni (hiyouga#7638): cache `_mm_inputs` (later removed), support `use_audio_in_video`, fix data, update mllm_video_audio_demo.json.
- [assets] update readme (hiyouga#7644)
- [assets] update readme (hiyouga#7654)
- [data] add coig-p dataset (hiyouga#7657)
- [misc] fix cuda warning on intel GPU (hiyouga#7655)
- [bugfix] enable_gemma_liger_kernel (hiyouga#7660): the `enable_liger_kernel` path for the Gemma model series was never executed because of the existing `if` statement; changed the line to an `elif` so that `apply_liger_kernel` runs properly. Resolves hiyouga#7628.
- [ray] allow specifying ray.init kwargs, i.e. runtime_env (hiyouga#7647). Co-authored-by: hoshi-hiyouga.
- [data] support specifying a dataset in cloud storage (hiyouga#7567): add support for loading datasets from s3/gcs, with comments in the readme.
- [assets] update wechat (hiyouga#7674)
- [deps] fix uv conflicts (hiyouga#7686): fix hiyouga#7678; update setup.py, tests.yml, publish.yml and the Makefile.
- [model] add GLM-4-0414 (hiyouga#7695)
- [deps] upgrade transformers (hiyouga#7704)
- [misc] upgrade cli (hiyouga#7714)
- [misc] fix env vars (hiyouga#7715)
- [model] support Kimi_VL thinking/instruct (hiyouga#7719): add kimi_vl, patch the config, check the version. Co-authored-by: hoshi-hiyouga.
- [assets] update model readme (hiyouga#7724)
- [docker] patch docker-rocm (hiyouga#7725): fix a typo, fix the /bin/sh conditional syntax, add build args to docker-compose, and change the shell to /bin/bash, which is required for the "==" string comparison.
- [deps] upgrade vllm (hiyouga#7728)
- [api] fix chat messages (hiyouga#7732)
- [assets] wechat (hiyouga#7740)
- [infer] support vllm-ascend (hiyouga#7739)
- [misc] improve entrypoint (hiyouga#7345): purely a cleanup of the entrypoint code, since it had too many if/else branches. Co-authored-by: hoshi-hiyouga.
- [model] support intern-VL 2.5-3 series (hiyouga#7258): add internvl and rebase, fix internvl2&3, fix video_inputs and lint, add constants, pass ci.
- [infer] set env for vllm ascend (hiyouga#7745)
- [breaking] bump transformers to 4.45.0 & improve ci (hiyouga#7746)
- [trainer] fix pt loss (hiyouga#7748): fix the pt loss, make it robust, add a test.
- [assets] update wechat (hiyouga#7792)
- [misc] fix bug in constant (hiyouga#7765). Co-authored-by: Sachin Beldona.
- [model] fix gemma3 export (hiyouga#7786). Co-authored-by: hoshi-hiyouga.
- [misc] fix new tokens adding (hiyouga#7253). Co-authored-by: hoshi-hiyouga.
- [data] fix wrong position ids with packed attention masks (hiyouga#7754). Co-authored-by: hoshi-hiyouga.
- [parser] support omegaconf (hiyouga#7793)
- [trainer] add Muon optimizer (hiyouga#7749). Co-authored-by: hoshi-hiyouga.
- [example] add bash usage (hiyouga#7794)
- [data] improve mmplugin (hiyouga#7795)
- [trainer] support early stop (hiyouga#7797)
- [misc] update internvl constants (hiyouga#7801)
- [model] add arch check for InternVL (hiyouga#7803)
- [assets] update model readme (hiyouga#7804)
- [data] fix internvl plugin (hiyouga#7817)
- [model] fix moe zero3 (hiyouga#7826)
- Merge commit from fork
- [model] fix vit gradient checkpointing (hiyouga#7830)
- [assets] update wechat (hiyouga#7840)
- [ray] add storage filesystem to ray config (hiyouga#7854)
- fix attn patch for kimivl (hiyouga#7867)
- [data] fix minicpmo vllm infer (hiyouga#7870)
- [trainer] make projector trainable in freeze training (hiyouga#7872). Co-authored-by: hoshi-hiyouga.
- [data] fix qwen2 omni plugin (hiyouga#7875)
- [model] fix dsv3 leaf node (hiyouga#7879)
- [data] fix qwen2.5 omni template (hiyouga#7883)
- [model] add qwen3 (hiyouga#7885): support lora sft for dsv3, update code, update the eval yaml, rebase and sync with the major branch, update the baseline.
1 parent 2833dde commit f5c6e80

File tree

161 files changed: +3890 −1693 lines changed


.env.local

Lines changed: 2 additions & 0 deletions
```diff
@@ -16,6 +16,8 @@ USE_MODELSCOPE_HUB=
 USE_OPENMIND_HUB=
 USE_RAY=
 RECORD_VRAM=
+OPTIM_TORCH=
+NPU_JIT_COMPILE=
 # torchrun
 FORCE_TORCHRUN=
 MASTER_ADDR=
```

.github/ISSUE_TEMPLATE/1-bug-report.yml

Lines changed: 1 addition & 1 deletion
```diff
@@ -12,7 +12,7 @@ body:
     attributes:
       value: |
         Please do not create issues that are not related to framework bugs under this category, use **[Discussions](https://github.com/hiyouga/LLaMA-Factory/discussions/categories/q-a)** instead.
-        请勿在此分类下创建和框架 bug 无关的 issues,请使用 **[讨论区](https://github.com/hiyouga/LLaMA-Factory/discussions/categories/q-a)**。
+        请勿在此分类下创建和框架 bug 无关的 issues,训练问题求助请使用 **[讨论区](https://github.com/hiyouga/LLaMA-Factory/discussions/categories/q-a)**。

   - type: checkboxes
     id: reminder
```

.github/workflows/publish.yml

Lines changed: 1 addition & 6 deletions
```diff
@@ -28,14 +28,9 @@ jobs:
         with:
           python-version: "3.9"

-      - name: Install dependencies
-        run: |
-          python -m pip install --upgrade pip
-          python -m pip install build
-
       - name: Build package
         run: |
-          python -m build
+          make build

       - name: Publish package
         uses: pypa/gh-action-pypi-publish@release/v1
```

.github/workflows/tests.yml

Lines changed: 35 additions & 3 deletions
```diff
@@ -22,7 +22,7 @@ jobs:
     strategy:
       fail-fast: false
       matrix:
-        python-version:
+        python:
           - "3.9"
           - "3.10"
           - "3.11"
@@ -31,9 +31,22 @@ jobs:
           - "ubuntu-latest"
           - "windows-latest"
           - "macos-13"
+        transformers:
+          - null
+        include: # test backward compatibility
+          - python: "3.9"
+            os: "ubuntu-latest"
+            transformers: "4.45.0"
+          - python: "3.9"
+            os: "ubuntu-latest"
+            transformers: "4.49.0"

     runs-on: ${{ matrix.os }}

+    concurrency:
+      group: ${{ github.workflow }}-${{ github.ref }}-${{ matrix.os }}-${{ matrix.python }}-${{ matrix.transformers }}
+      cancel-in-progress: ${{ github.ref != 'refs/heads/main' }}
+
     env:
       HF_TOKEN: ${{ secrets.HF_TOKEN }}
       OS_NAME: ${{ matrix.os }}
@@ -45,15 +58,27 @@ jobs:
       - name: Set up Python
         uses: actions/setup-python@v5
         with:
-          python-version: ${{ matrix.python-version }}
+          python-version: ${{ matrix.python }}
           cache: "pip"
-          cache-dependency-path: "setup.py"
+          cache-dependency-path: "**/requirements*.txt"

       - name: Install dependencies
         run: |
          python -m pip install --upgrade pip
          python -m pip install ".[torch,dev]"

+      - name: Install transformers
+        if: ${{ matrix.transformers }}
+        run: |
+          python -m pip install "transformers==${{ matrix.transformers }}"
+
+      - name: Cache files
+        id: hf-hub-cache
+        uses: actions/cache@v4
+        with:
+          path: ${{ runner.temp }}/huggingface
+          key: huggingface-${{ matrix.os }}-${{ matrix.python }}-${{ matrix.transformers }}-${{ hashFiles('tests/version.txt') }}
+
       - name: Check quality
         run: |
           make style && make quality
@@ -62,6 +87,13 @@ jobs:
         run: |
           make license

+      - name: Check build
+        run: |
+          make build
+
       - name: Test with pytest
         run: |
           make test
+        env:
+          HF_HOME: ${{ runner.temp }}/huggingface
+          HF_HUB_OFFLINE: "${{ steps.hf-hub-cache.outputs.cache-hit == 'true' && '1' || '0' }}"
```

.gitignore

Lines changed: 3 additions & 1 deletion
```diff
@@ -185,4 +185,6 @@ test.py
 gen_ans_wo_think.py
 *.code-workspace
 *.xlsx
-templates
+templates
+*.code-workspace
+*.xlsx
```

Makefile

Lines changed: 1 addition & 1 deletion
```diff
@@ -3,7 +3,7 @@
 check_dirs := scripts src tests setup.py

 build:
-	pip install build && python -m build
+	pip3 install build && python3 -m build

 commit:
 	pre-commit install
```

README.md

Lines changed: 54 additions & 25 deletions
Large diffs are not rendered by default.

README_zh.md

Lines changed: 55 additions & 25 deletions
Large diffs are not rendered by default.

assets/wechat.jpg

2.31 KB

assets/wechat_npu.jpg

533 Bytes

data/README.md

Lines changed: 5 additions & 4 deletions
````diff
@@ -4,9 +4,10 @@ Currently we support datasets in **alpaca** and **sharegpt** format.

 ```json
 "dataset_name": {
-  "hf_hub_url": "the name of the dataset repository on the Hugging Face hub. (if specified, ignore script_url and file_name)",
-  "ms_hub_url": "the name of the dataset repository on the Model Scope hub. (if specified, ignore script_url and file_name)",
-  "script_url": "the name of the directory containing a dataset loading script. (if specified, ignore file_name)",
+  "hf_hub_url": "the name of the dataset repository on the Hugging Face hub. (if specified, ignore script_url, file_name and cloud_file_name)",
+  "ms_hub_url": "the name of the dataset repository on the Model Scope hub. (if specified, ignore script_url, file_name and cloud_file_name)",
+  "script_url": "the name of the directory containing a dataset loading script. (if specified, ignore file_name and cloud_file_name)",
+  "cloud_file_name": "the name of the dataset file in s3/gcs cloud storage. (if specified, ignore file_name)",
   "file_name": "the name of the dataset folder or dataset file in this directory. (required if above are not specified)",
   "formatting": "the format of the dataset. (optional, default: alpaca, can be chosen from {alpaca, sharegpt})",
   "ranking": "whether the dataset is a preference dataset or not. (default: False)",
@@ -85,7 +86,7 @@ Regarding the above dataset, the *dataset description* in `dataset_info.json` sh

 ### Pre-training Dataset

-- [Example dataset](c4_demo.json)
+- [Example dataset](c4_demo.jsonl)

 In pre-training, only the `text` column will be used for model learning.
````
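Given the new `cloud_file_name` field documented in the diff above, a `dataset_info.json` entry that loads from cloud storage might look like the following sketch; the dataset name, bucket and path are hypothetical, and whether the value is a bare file name or a full s3/gcs URI should be checked against the repository's loader:

```json
"alpaca_s3_demo": {
  "cloud_file_name": "s3://my-bucket/data/alpaca_demo.json",
  "formatting": "alpaca"
}
```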

data/README_zh.md

Lines changed: 1 addition & 1 deletion
```diff
@@ -85,7 +85,7 @@

 ### 预训练数据集

-- [样例数据集](c4_demo.json)
+- [样例数据集](c4_demo.jsonl)

 在预训练时,只有 `text` 列中的内容会用于模型学习。
```

0 commit comments