lihuigu committed on
Commit
0b619bd
·
1 Parent(s): 23add18

update assets

Browse files
assets/data/test_background.json ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ {"background": "The application scope of large-scale language models such as GPT-4 and LLaMA has rapidly expanded, demonstrating powerful capabilities in natural language processing and multimodal tasks. However, as the size and complexity of the models increase, understanding how they make decisions becomes increasingly difficult. Challenge: 1. The complexity of model interpretation: The billions of parameters and nonlinear decision paths within large-scale language models make it very difficult to track and interpret specific outputs. The existing interpretation methods usually only provide a local perspective and are difficult to systematize. 2. Transparency and Fairness: In specific scenarios, models may exhibit biased or discriminatory behavior. Ensuring the transparency of these models, reducing bias, and providing credible explanations is one of the current challenges."}
2
+ {"background": "Multimodal learning is committed to integrating multiple information sources such as text, images, audio, and video to create more powerful and universal AI models. The research on unified representation aims to find representation methods that can generalize across modalities. Challenge: 1. Modal alignment: There is heterogeneity between different modalities, and how to achieve semantic alignment of these modalities to ensure that the model can comprehensively understand different types of data is a core challenge. 2. Data sparsity and imbalance: There is usually an imbalance in the amount of data in different modalities, such as video and audio data being relatively scarce, while text data is relatively abundant. How to effectively utilize and fuse these modalities to avoid overfitting or underfitting remains a research difficulty.", "cue_words": ["cross-modal embedding", "data augmentation", "modality-aware fusion", "heterogeneous data integration"]}
assets/data/user_agents.txt ADDED
@@ -0,0 +1,36 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Mozilla/5.0 (Macintosh; U; Intel Mac OS X 10_6_8; en-us) AppleWebKit/534.50 (KHTML, like Gecko) Version/5.1 Safari/534.50
2
+ Mozilla/5.0 (Windows; U; Windows NT 6.1; en-us) AppleWebKit/534.50 (KHTML, like Gecko) Version/5.1 Safari/534.50
3
+ Mozilla/5.0 (Windows NT 10.0; WOW64; rv:38.0) Gecko/20100101 Firefox/38.0
4
+ Mozilla/5.0 (Windows NT 10.0; WOW64; Trident/7.0; .NET4.0C; .NET4.0E; .NET CLR 2.0.50727; .NET CLR 3.0.30729; .NET CLR 3.5.30729; InfoPath.3; rv:11.0) like Gecko
5
+ Mozilla/5.0 (compatible; MSIE 9.0; Windows NT 6.1; Trident/5.0)
6
+ Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 6.0; Trident/4.0)
7
+ Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 6.0)
8
+ Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1)
9
+ Mozilla/5.0 (Macintosh; Intel Mac OS X 10.6; rv:2.0.1) Gecko/20100101 Firefox/4.0.1
10
+ Mozilla/5.0 (Windows NT 6.1; rv:2.0.1) Gecko/20100101 Firefox/4.0.1
11
+ Opera/9.80 (Macintosh; Intel Mac OS X 10.6.8; U; en) Presto/2.8.131 Version/11.11
12
+ Opera/9.80 (Windows NT 6.1; U; en) Presto/2.8.131 Version/11.11
13
+ Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_0) AppleWebKit/535.11 (KHTML, like Gecko) Chrome/17.0.963.56 Safari/535.11
14
+ Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 5.1; Maxthon 2.0)
15
+ Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 5.1; TencentTraveler 4.0)
16
+ Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 5.1)
17
+ Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 5.1; The World)
18
+ Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 5.1; Trident/4.0; SE 2.X MetaSr 1.0; SE 2.X MetaSr 1.0; .NET CLR 2.0.50727; SE 2.X MetaSr 1.0)
19
+ Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 5.1; 360SE)
20
+ Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 5.1; Avant Browser)
21
+ Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 5.1)
22
+ Mozilla/5.0 (iPhone; U; CPU iPhone OS 4_3_3 like Mac OS X; en-us) AppleWebKit/533.17.9 (KHTML, like Gecko) Version/5.0.2 Mobile/8J2 Safari/6533.18.5
23
+ Mozilla/5.0 (iPod; U; CPU iPhone OS 4_3_3 like Mac OS X; en-us) AppleWebKit/533.17.9 (KHTML, like Gecko) Version/5.0.2 Mobile/8J2 Safari/6533.18.5
24
+ Mozilla/5.0 (iPad; U; CPU OS 4_3_3 like Mac OS X; en-us) AppleWebKit/533.17.9 (KHTML, like Gecko) Version/5.0.2 Mobile/8J2 Safari/6533.18.5
25
+ Mozilla/5.0 (Linux; U; Android 2.3.7; en-us; Nexus One Build/FRF91) AppleWebKit/533.1 (KHTML, like Gecko) Version/4.0 Mobile Safari/533.1
26
+ MQQBrowser/26 Mozilla/5.0 (Linux; U; Android 2.3.7; zh-cn; MB200 Build/GRJ22; CyanogenMod-7) AppleWebKit/533.1 (KHTML, like Gecko) Version/4.0 Mobile Safari/533.1
27
+ Opera/9.80 (Android 2.3.4; Linux; Opera Mobi/build-1107180945; U; en-GB) Presto/2.8.149 Version/11.10
28
+ Mozilla/5.0 (Linux; U; Android 3.0; en-us; Xoom Build/HRI39) AppleWebKit/534.13 (KHTML, like Gecko) Version/4.0 Safari/534.13
29
+ Mozilla/5.0 (BlackBerry; U; BlackBerry 9800; en) AppleWebKit/534.1+ (KHTML, like Gecko) Version/6.0.0.337 Mobile Safari/534.1+
30
+ Mozilla/5.0 (hp-tablet; Linux; hpwOS/3.0.0; U; en-US) AppleWebKit/534.6 (KHTML, like Gecko) wOSBrowser/233.70 Safari/534.6 TouchPad/1.0
31
+ Mozilla/5.0 (SymbianOS/9.4; Series60/5.0 NokiaN97-1/20.0.019; Profile/MIDP-2.1 Configuration/CLDC-1.1) AppleWebKit/525 (KHTML, like Gecko) BrowserNG/7.1.18124
32
+ Mozilla/5.0 (compatible; MSIE 9.0; Windows Phone OS 7.5; Trident/5.0; IEMobile/9.0; HTC; Titan)
33
+ UCWEB7.0.2.37/28/999
34
+ NOKIA5700/ UCWEB7.0.2.37/28/999
35
+ Openwave/ UCWEB7.0.2.37/28/999
36
+ Mozilla/4.0 (compatible; MSIE 6.0; ) Opera/UCWEB7.0.2.37/28/999
prompt/summarizing.xml DELETED
@@ -1,43 +0,0 @@
1
- <?xml version="1.0" encoding="utf-8"?>
2
- <!DOCTYPE body [
3
- <!ENTITY warning "Warning: Something bad happened... please refresh and try again.">
4
- ]>
5
- <body>
6
- <query rank="0">
7
- <title>User Message</title>
8
- <text>
9
- Task Description:
10
-
11
- You are provided with the title, abstract, and introduction of a research paper. Your task is to generate a concise summary of what kind of problem does this paper aim to solve and what methods are proposed to address it. The summary should follow this format:
12
- The problem of [problem] can be addressed by [main idea/approach].
13
-
14
- Instructions:
15
-
16
- Title: Read the title to understand the general topic of the paper.
17
- Abstract: Read the abstract to get a concise summary of the research, including the problem addressed, the methods used, and the main findings.
18
- Introduction: Read the introduction to gain a deeper understanding of the background, significance, and specific problem the paper addresses, as well as the proposed approach or solution.
19
- Based on the provided information, generate a single sentence that captures the essence of the paper, following the format specified above.
20
-
21
- Your Turn:
22
-
23
- Given the following paper information:
24
- Title: {title}
25
- Abstract: {abstract}
26
- Introduction: {introduction}
27
-
28
- Output:
29
- The problem of [problem] can be addressed by [main idea/approach].
30
- </text>
31
- </query>
32
- <query rank="1">
33
- <title>User Message</title>
34
- <text>
35
- Please read the title, abstract, and introduction of the paper again, as well as the summary you provided. Complete the following two tasks:
36
- 1.Briefly provide the two most critical motivations behind proposing these methods to address the problems.
37
- 2.Briefly provide the three most critical or innovative details of the paper that were not mentioned in your summary (It's best if these details are the new methods or techniques adopted in this paper).
38
-
39
- Output:
40
- Motivations:1.[motivation1]. 2.[motivation2]. Details:1.[detail1]. 2.[detail2]. 3.[detail3].
41
- </text>
42
- </query>
43
- </body>
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
src/config/__init__.py ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ r"""_summary_
2
+ -*- coding: utf-8 -*-
3
+
4
+ Module : config
5
+
6
+ File Name : __init__.py
7
+
8
+ Description : About config.
9
+ for example:
10
+ ```
11
+ from config import ConfigReader
12
+
13
+ config = ConfigReader.load(f, **kwargs)
14
+ ```
15
+
16
+ Creation Date : 2024-10-30
17
+
18
+ Author : Frank Kang([email protected])
19
+ """
20
+ from .reader import ConfigReader
21
+
22
+ __all__ = ['ConfigReader']
configs/config.py → src/config/reader.py RENAMED
@@ -1,13 +1,13 @@
1
  r"""_summary_
2
  -*- coding: utf-8 -*-
3
 
4
- Module : configs.config
5
 
6
- File Name : config.py
7
 
8
  Description : Load the config file, which supports referencing other configuration files. If a circular reference occurs, an exception will be thrown
9
-
10
- Creation Date : 2024-08-18
11
 
12
  Author : Frank Kang([email protected])
13
  """
@@ -57,7 +57,10 @@ def update_config_with_api_aliases(config, llms_api, sum_api, gen_api):
57
  gen_api_found = check_api_alias(config, gen_api)
58
  if gen_api_found is None:
59
  raise KeyError('{} cannot match any llms api in config'.format(gen_api))
60
- config.used_llms_apis = {'summarization': sum_api_found, 'generation': gen_api_found}
 
 
 
61
 
62
 
63
  class ConfigReader:
 
1
  r"""_summary_
2
  -*- coding: utf-8 -*-
3
 
4
+ Module : config.reader
5
 
6
+ File Name : reader.py
7
 
8
  Description : Load the config file, which supports referencing other configuration files. If a circular reference occurs, an exception will be thrown
9
+
10
+ Creation Date : 2024-07-13
11
 
12
  Author : Frank Kang([email protected])
13
  """
 
57
  gen_api_found = check_api_alias(config, gen_api)
58
  if gen_api_found is None:
59
  raise KeyError('{} cannot match any llms api in config'.format(gen_api))
60
+ config.used_llms_apis = {
61
+ 'summarization': sum_api_found,
62
+ 'generation': gen_api_found
63
+ }
64
 
65
 
66
  class ConfigReader:
{configs → src/config}/utils.py RENAMED
@@ -1,9 +1,19 @@
1
  #!/usr/bin/env python
2
- # coding: utf-8
3
- # Author: Frank Kang
4
- # Data: 13 July 2024
 
 
 
 
 
 
 
 
 
 
5
  import os
6
- ROOT = os.path.dirname(os.path.dirname(__file__))
7
 
8
 
9
  def get_dir(config_dir):
 
1
  #!/usr/bin/env python
2
+ r"""_summary_
3
+ -*- coding: utf-8 -*-
4
+
5
+ Module : config.utils
6
+
7
+ File Name : utils.py
8
+
9
+ Description : utils about path
10
+
11
+ Creation Date : 2024-07-13
12
+
13
+ Author : Frank Kang([email protected])
14
+ """
15
  import os
16
+ ROOT = os.path.dirname(os.path.dirname(os.path.dirname(__file__)))
17
 
18
 
19
  def get_dir(config_dir):
prompt/prompt_reader.py → src/prompt/reader.py RENAMED
@@ -1,8 +1,17 @@
1
  #!/usr/bin/env python
2
- # coding: utf-8
3
- # Author: Frank Kang
4
- # Data: 16 July 2024
5
 
 
 
 
 
 
 
 
 
 
 
6
  import xml.etree.ElementTree as ET
7
  from xml.etree.ElementTree import Element
8
 
 
1
  #!/usr/bin/env python
2
+ r"""_summary_
3
+ -*- coding: utf-8 -*-
 
4
 
5
+ Module : prompt.reader
6
+
7
+ File Name : reader.py
8
+
9
+ Description : Read prompt template
10
+
11
+ Creation Date : 2024-07-16
12
+
13
+ Author : Frank Kang([email protected])
14
+ """
15
  import xml.etree.ElementTree as ET
16
  from xml.etree.ElementTree import Element
17
 
src/utils/header.py CHANGED
@@ -1,11 +1,20 @@
1
- import sys
2
- import os
3
 
4
- sys.path.append(
5
- os.path.dirname(os.path.dirname(os.path.dirname(os.path.realpath(__file__))))
6
- )
7
- from configs.utils import get_dir
8
- from configs.config import ConfigReader
9
- from prompt.prompt_reader import Prompt, AssistantCreateQuery, MessageQuery
10
 
11
- __all__ = ["get_dir", "ConfigReader", "Prompt", "AssistantCreateQuery", "MessageQuery"]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ r"""_summary_
2
+ -*- coding: utf-8 -*-
3
 
4
+ Module : utils.header
 
 
 
 
 
5
 
6
+ File Name : header.py
7
+
8
+ Description : import some modules from top-level package
9
+
10
+ Creation Date : 2024-07-16
11
+
12
+ Author : Frank Kang([email protected])
13
+ """
14
+ from config.utils import get_dir
15
+ from config import ConfigReader
16
+ from prompt.reader import Prompt, AssistantCreateQuery, MessageQuery
17
+
18
+ __all__ = [
19
+ "get_dir", "ConfigReader", "Prompt", "AssistantCreateQuery", "MessageQuery"
20
+ ]