aeye-lab · SiQube · Mar 25, 2025 · Mar 25, 2025 · dkrako · Mar 25, 2025
@@ -1057,6 +1057,14 @@ def extract(
         )
         return self
 
+    @property
+    def info(self) -> None:
+        """The information about the dataset.
+
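+        Accessing this property prints ``self.definition.info`` (the dataset description and
+        citation entry) to standard output and returns ``None``.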
+        """
+        print(self.definition.info)
+
     @property
     def path(self) -> Path:
         """The path to the dataset directory.

@@ -47,6 +47,9 @@ class DatasetDefinition:
     ----------
     name: str
         The name of the dataset. (default: '.')
+    info: str
+        Information about the dataset, including but not limited to the original citation
+        and general information. (default: '')
     has_files: dict[str, bool]
         Indicate whether the dataset contains 'gaze', 'precomputed_events', and
         'precomputed_reading_measures'.
@@ -142,6 +145,9 @@ class DatasetDefinition:
 
     # pylint: disable=too-many-instance-attributes
     name: str = '.'
+
+    info: str = ''
+
     has_files: dict[str, bool] = field(default_factory=dict)
 
     mirrors: dict[str, list[str]] | dict[str, tuple[str, ...]] = field(default_factory=dict)

@@ -31,7 +31,7 @@
 class BSC(DatasetDefinition):
     """BSC dataset :cite:p:`BSC`.
 
-    This dataset includes monocular eye tracking data from a single participant in a single
+    This dataset includes monocular eye tracking data from several participants in a single
     session. Eye movements are recorded at a sampling frequency of 1,000 Hz using an EyeLink 1000
     eye tracker and precomputed events on aoi level are reported.
 
@@ -44,6 +44,10 @@ class BSC(DatasetDefinition):
     name: str
         The name of the dataset.
 
+    info: str
+        Information about the dataset, including but not limited to the original citation
+        and general information.
+
     has_files: dict[str, bool]
         Indicate whether the dataset contains 'gaze', 'precomputed_events', and
         'precomputed_reading_measures'.
@@ -84,11 +88,11 @@ class BSC(DatasetDefinition):
     Examples
     --------
     Initialize your :py:class:`~pymovements.dataset.Dataset` object with the
-    :py:class:`~pymovements.datasets.SBSAT` definition:
+    :py:class:`~pymovements.datasets.BSC` definition:
 
     >>> import pymovements as pm
     >>>
-    >>> dataset = pm.Dataset("SBSAT", path='data/SBSAT')
+    >>> dataset = pm.Dataset("BSC", path='data/BSC')
 
     Download the dataset resources:
 
@@ -104,6 +108,30 @@ class BSC(DatasetDefinition):
 
     name: str = 'BSC'
 
+    info: str = """\
+BSC dataset :cite:p:`BSC`.
+
+This dataset includes monocular eye tracking data from several participants in a single
+session. Eye movements are recorded at a sampling frequency of 1,000 Hz using an EyeLink 1000
+eye tracker and precomputed events on aoi level are reported.
+
+The participant is instructed to read texts and answer questions.
+
+Check the respective paper for details :cite:p:`BSC`.
+
+If you use the dataset, please cite:
+
+@article{BSC,
+    author={Pan, Jinger and Yan, Ming and Richter, Eike M. and Shu, Hua and Kliegl, Reinhold},
+    title={The {B}eijing {S}entence {C}orpus: A {C}hinese sentence corpus
+    with eye movement data and predictability norms},
+    journal={Behavior Research Methods},
+    year={2022},
+    volume={54},
+    issue={4},
+}
+"""
+
     has_files: dict[str, bool] = field(
         default_factory=lambda: {
             'gaze': False,

@@ -1,5 +1,28 @@
 name: BSC
 
+info: |
+    BSC dataset :cite:p:`BSC`.
+
+    This dataset includes monocular eye tracking data from several participants in a single
+    session. Eye movements are recorded at a sampling frequency of 1,000 Hz using an EyeLink 1000
+    eye tracker and precomputed events on aoi level are reported.
+
+    The participant is instructed to read texts and answer questions.
+
+    Check the respective paper for details :cite:p:`BSC`.
+
+    If you use the dataset, please cite:
+
+    @article{BSC,
+        author={Pan, Jinger and Yan, Ming and Richter, Eike M. and Shu, Hua and Kliegl, Reinhold},
+        title={The {B}eijing {S}entence {C}orpus: A {C}hinese sentence corpus
+        with eye movement data and predictability norms},
+        journal={Behavior Research Methods},
+        year={2022},
+        volume={54},
+        issue={4},
+    }
+
 has_files:
   gaze: false
   precomputed_events: true

@@ -31,7 +31,7 @@
 class BSCII(DatasetDefinition):
     """BSCII dataset :cite:p:`BSCII`.
 
-    This dataset includes monocular eye tracking data from a single participant in a single
+    This dataset includes monocular eye tracking data from several participants in a single
     session. Eye movements are recorded at a sampling frequency of 1,000 Hz using an EyeLink 1000
     eye tracker and precomputed events on aoi level are reported.
 
@@ -45,6 +45,10 @@ class BSCII(DatasetDefinition):
     name: str
         The name of the dataset.
 
+    info: str
+        Information about the dataset, including but not limited to the original citation
+        and general information.
+
     has_files: dict[str, bool]
         Indicate whether the dataset contains 'gaze', 'precomputed_events', and
         'precomputed_reading_measures'.
@@ -105,6 +109,31 @@ class BSCII(DatasetDefinition):
 
     name: str = 'BSCII'
 
+    info: str = """\
+BSCII dataset :cite:p:`BSCII`.
+
+This dataset includes monocular eye tracking data from several participants in a single
+session. Eye movements are recorded at a sampling frequency of 1,000 Hz using an EyeLink 1000
+eye tracker and precomputed events on aoi level are reported.
+
+The participant is instructed to read texts and answer questions. The original purpose was to
+look into the differences in processing when reading simplified and traditional Chinese.
+
+Check the respective paper for details :cite:p:`BSCII`.
+
+If you use the dataset, please cite:
+
+@article{BSCII,
+    author={Yan, Ming and Pan, Jinger and Kliegl, Reinhold},
+    title={The {B}eijing {S}entence {C}orpus {II}: A cross-script comparison
+    between traditional and simplified Chinese sentence reading},
+    journal={Behavior Research Methods},
+    year={2025},
+    volume={57},
+    issue={2},
+}
+"""
+
     has_files: dict[str, bool] = field(
         default_factory=lambda: {
             'gaze': False,

@@ -1,5 +1,29 @@
 name: "BSCII"
 
+info: |
+    BSCII dataset :cite:p:`BSCII`.
+
+    This dataset includes monocular eye tracking data from several participants in a single
+    session. Eye movements are recorded at a sampling frequency of 1,000 Hz using an EyeLink 1000
+    eye tracker and precomputed events on aoi level are reported.
+
+    The participant is instructed to read texts and answer questions. The original purpose was to
+    look into the differences in processing when reading simplified and traditional Chinese.
+
+    Check the respective paper for details :cite:p:`BSCII`.
+
+    If you use the dataset, please cite:
+
+    @article{BSCII,
+        author={Yan, Ming and Pan, Jinger and Kliegl, Reinhold},
+        title={The {B}eijing {S}entence {C}orpus {II}: A cross-script comparison
+        between traditional and simplified Chinese sentence reading},
+        journal={Behavior Research Methods},
+        year={2025},
+        volume={57},
+        issue={2},
+    }
+
 has_files:
   gaze: false
   precomputed_events: true

@@ -44,6 +44,10 @@ class CodeComprehension(DatasetDefinition):
     name: str
         The name of the dataset.
 
+    info: str
+        Information about the dataset, including but not limited to the original citation
+        and general information.
+
     has_files: dict[str, bool]
         Indicate whether the dataset contains 'gaze', 'precomputed_events', and
         'precomputed_reading_measures'.
@@ -98,6 +102,36 @@ class CodeComprehension(DatasetDefinition):
 
     name: str = 'CodeComprehension'
 
+    info: str = """\
+CodeComprehension dataset :cite:p:`CodeComprehension`.
+
+This dataset includes eye-tracking-while-code-reading data from participants in a single
+session. Eye movements are recorded at a sampling frequency of 1,000 Hz using an
+EyeLink 1000 eye tracker and are provided as pixel coordinates.
+
+The participant is instructed to read the code snippet and answer a code comprehension question.
+
+If you use the dataset, please cite:
+
+@article{CodeComprehension,
+  author = {Alakmeh, Tarek and Reich, David and J\\"{a}ger, Lena and Fritz, Thomas},
+  title = {Predicting Code Comprehension: A Novel Approach to
+  Align Human Gaze with Code using Deep Neural Networks},
+  year = {2024},
+  issue_date = {July 2024},
+  publisher = {Association for Computing Machinery},
+  address = {New York, NY, USA},
+  volume = {1},
+  number = {FSE},
+  url = {https://doi.org/10.1145/3660795},
+  doi = {10.1145/3660795},
+  journal = {Proc. ACM Softw. Eng.},
+  month = {jul},
+  articleno = {88},
+  numpages = {23},
+}
+"""
+
     has_files: dict[str, bool] = field(
         default_factory=lambda: {
             'gaze': False,

@@ -1,5 +1,34 @@
 name: CodeComprehension
 
+info: |
+    CodeComprehension dataset :cite:p:`CodeComprehension`.
+
+    This dataset includes eye-tracking-while-code-reading data from participants in a single
+    session. Eye movements are recorded at a sampling frequency of 1,000 Hz using an
+    EyeLink 1000 eye tracker and are provided as pixel coordinates.
+
+    The participant is instructed to read the code snippet and answer a code comprehension question.
+
+    If you use the dataset, please cite:
+
+    @article{CodeComprehension,
+      author = {Alakmeh, Tarek and Reich, David and J\"{a}ger, Lena and Fritz, Thomas},
+      title = {Predicting Code Comprehension: A Novel Approach to
+      Align Human Gaze with Code using Deep Neural Networks},
+      year = {2024},
+      issue_date = {July 2024},
+      publisher = {Association for Computing Machinery},
+      address = {New York, NY, USA},
+      volume = {1},
+      number = {FSE},
+      url = {https://doi.org/10.1145/3660795},
+      doi = {10.1145/3660795},
+      journal = {Proc. ACM Softw. Eng.},
+      month = {jul},
+      articleno = {88},
+      numpages = {23},
+    }
+
 has_files:
   gaze: false
   precomputed_events: true