update

meta-tabchen · meta-tabchen · commit 4547cf86236e · 2022-06-08T18:13:38.000+08:00
diff --git a/.gitignore b/.gitignore
@@ -13,4 +13,5 @@ dist/
 *.pyc
 docs/
 *.pkl
-saved_model
+saved_model
+build/
diff --git a/README.md b/README.md
@@ -7,7 +7,7 @@ PyKT is a python library build upon PyTorch to train deep learning based knowled
 Use the following command to install PyKT:
 
 ```
-pip install -U pykt-toolkit
+pip install -U pykt-toolkit -i  https://pypi.python.org/simple 
 ```
 
 <!-- 
diff --git a/build.sh b/build.sh
@@ -1,3 +1,3 @@
-rm -r dist
 python -m build
-twine upload dist/*
+twine upload dist/*
+rm -r dist
diff --git a/pykt/datasets/data_loader.py b/pykt/datasets/data_loader.py
@@ -8,21 +8,29 @@
 from torch.cuda import FloatTensor, LongTensor
 import numpy as np
 
+
+
 class KTDataset(Dataset):
     """Dataset for KT
         Can be used to build the dataset (for all models except dkt_forget) for:
             train data, valid data,
             common test data (concept-level evaluation), and real educational scenario test data (question-level evaluation).
+
+    Args:
+        file_path (str): train_valid/test file path
+        input_type (list[str]): the input type of the dataset, values are in ["questions", "concepts"]
+        folds (set(int)): the folds used to generate dataset, -1 for test data
+        qtest (bool, optional): whether to use question-level evaluation. Defaults to False.
     """
     def __init__(self, file_path, input_type, folds, qtest=False):
-        """init KTDataset
-
-        Args:
-            file_path (str): train_valid/test file path
-            input_type (list[str]): the input type of the dataset, values are in ["questions", "concepts"]
-            folds (set(int)): the folds used to generate dataset, -1 for test data
-            qtest (bool, optional): is question evaluation or not. Defaults to False.
-        """
+        # """init KTDataset
+
+        # Args:
+        #     file_path (str): train_valid/test file path
+        #     input_type (list[str]): the input type of the dataset, values are in ["questions", "concepts"]
+        #     folds (set(int)): the folds used to generate dataset, -1 for test data
+        #     qtest (bool, optional): is question evaluation or not. Defaults to False.
+        # """
         super(KTDataset, self).__init__()
         sequence_path = file_path
         self.input_type = input_type
@@ -65,6 +73,7 @@ def __getitem__(self, index):
             index (int): the index of the data want to get
 
         Returns:
+            (tuple): tuple containing:
             q_seqs (torch.tensor): question id sequence of the 0~seqlen-2 interactions
             c_seqs (torch.tensor): knowledge concept id sequence of the 0~seqlen-2 interactions
             r_seqs (torch.tensor): response id sequence of the 0~seqlen-2 interactions
@@ -95,6 +104,8 @@ def __getitem__(self, index):
                 dcur[key] = self.dqtest[key][index]
             return q_seqs, c_seqs, r_seqs, qshft_seqs, cshft_seqs, rshft_seqs, mask_seqs, select_masks, dcur
 
+
+
     def load_data(self, sequence_path, folds, pad_val=-1):
         """load data
 
@@ -103,14 +114,19 @@ def load_data(self, sequence_path, folds, pad_val=-1):
             folds (list[int]): 
             pad_val (int, optional): pad value. Defaults to -1.
 
-        Returns:
-            q_seqs (torch.tensor): question id sequence of the 0~seqlen-1 interactions
-            c_seqs (torch.tensor): knowledge concept id sequence of the 0~seqlen-1 interactions
-            r_seqs (torch.tensor): response id sequence of the 0~seqlen-1 interactions
-            mask_seqs (torch.tensor): masked value sequence, shape is seqlen-1
-            select_masks (torch.tensor): is select to calculate the performance or not, 0 is not selected, 1 is selected, only available for 1~seqlen-1, shape is seqlen-1
-            dqtest (dict): not null only self.qtest is True, for question level evaluation
+        Returns:
+            (tuple): tuple containing:
+
+            - **q_seqs (torch.tensor)**: question id sequence of the 0~seqlen-1 interactions
+            - **c_seqs (torch.tensor)**: knowledge concept id sequence of the 0~seqlen-1 interactions
+            - **r_seqs (torch.tensor)**: response id sequence of the 0~seqlen-1 interactions
+            - **mask_seqs (torch.tensor)**: masked value sequence, shape is seqlen-1
+            - **select_masks (torch.tensor)**: whether each position is selected for calculating the performance, 0 is not selected, 1 is selected, only available for 1~seqlen-1, shape is seqlen-1
+            - **dqtest (dict)**: not null only when self.qtest is True, for question-level evaluation
+
+
         """
+
         seq_qids, seq_cids, seq_rights, seq_mask = [], [], [], []
         df = pd.read_csv(sequence_path)
         df = df[df["fold"].isin(folds)]