---
# Retriever settings.
retriever:
  # Maps a retriever name to a Hugging Face path.
  # NOTE(review): the value looks like a Hub repo id ("owner/name") holding a
  # prebuilt index - confirm against the code that loads it.
  retriever_hf_paths:
    RAGatouille: "XThomasBU/Colbert_Index"

# Course-site metadata: where the course pages live, how URLs are mapped to
# content types, and which fields are read from each page.
metadata:
  # Course site pages: the sp2025 site root and its schedule page.
  metadata_links:
    - "https://dl4ds.github.io/sp2025/"
    - "https://dl4ds.github.io/sp2025/schedule/"

  # Base URL for slide links.
  # NOTE(review): presumably prefixed to relative slide paths - confirm.
  slide_base_link: "https://dl4ds.github.io"

  # Assignment base link is used to find the webpage where the assignment is
  # described/posted.
  # NOTE(review): this points at tools4ds fa2024 while the links above point
  # at dl4ds sp2025 - confirm this is intentional.
  assignment_base_link: "https://tools4ds.github.io/fa2024/assignments/"

  # Define content types - assignments, lectures, etc.
  content_types:
    - "lectures"
    - "assignments"
    - "discussion"
    - "other"

  # These need to be patterns from URLs that can be used to identify the type
  # of content uniquely.
  # NOTE(review): project_pattern has no matching entry in content_types
  # (which lists "other" instead) - confirm how project URLs are classified.
  lectures_pattern: "/lectures/"
  assignments_pattern: "/assignments/"
  discussion_pattern: "/discussion/"
  project_pattern: "/project/"

  # These are fields that can be extracted from the webpages of the course
  # content.
  lecture_metadata_fields:
    - "title"
    - "tldr"
    - "date"
    - "lecture_recording"
    - "suggested_readings"

  assignment_metadata_fields:
    - "title"
    - "release_date"
    - "due_date"
    - "source_file"

# Token budget settings.
# NOTE(review): units and exact semantics are not stated in this file; the
# notes below are assumptions to confirm against the code that reads them.
token_config:
  # presumably seconds - confirm
  cooldown_time: 60
  # presumably seconds - confirm
  regen_time: 180
  # presumably the starting token balance - confirm
  tokens_left: 50000
  # presumably the lifetime token allocation - confirm
  all_time_tokens_allocated: 1000000

# Content-splitting settings.
content:
  # Each entry is a two-element list: a header marker ("##", "#") and a label
  # for it ("Section", "Title").
  # NOTE(review): presumably Markdown header prefixes used to split notebook
  # text, with the label used as a metadata key - confirm against the splitter.
  notebookheaders_to_split_on:
    - ["##", "Section"]
    - ["#", "Title"]

# Miscellaneous project links.
misc:
  # URL of the project's GitHub repository.
  github_repo: "https://github.com/edubotics-ai/edubot-core"
  # URL of the documentation website.
  docs_website: "https://dl4ds.github.io/dl4ds_tutor/"

# API client settings.
api_config:
  # NOTE(review): unit is not stated here; presumably seconds - confirm.
  timeout: 60