File size: 1,340 Bytes
6b7fe9a
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
<?xml version="1.0" encoding="UTF-8"?>
<!-- Item-level metadata record for the item identified as "gpt4chan_model". -->
<metadata>
  <identifier>gpt4chan_model</identifier>
  <!-- "collection" is a repeated element: a second occurrence appears near the
       end of this record. NOTE(review): sibling order may be significant to
       the consumer, so the two occurrences are kept in their original places. -->
  <collection>imageboard_datasets</collection>
  <licenseurl>https://www.apache.org/licenses/LICENSE-2.0</licenseurl>
  <scanner>Internet Archive Python library 3.0.1</scanner>
  <mediatype>data</mediatype>
  <uploader>valentino.giudice96@gmail.com</uploader>
  <title>GPT-4chan Model</title>
  <!-- Timestamps are written as "YYYY-MM-DD hh:mm:ss" with no zone designator;
       presumably UTC (TODO confirm against the producing system). -->
  <publicdate>2022-06-07 01:56:14</publicdate>
  <addeddate>2022-06-07 01:56:14</addeddate>
  <!-- Several bracket-tagged fields ([curator], [date], [comment]) are packed
       into one text value. The [date] field looks like YYYYMMDDhhmmss
       (TODO confirm). -->
  <curation>[curator]validator@archive.org[/curator][date]20220607020703[/date][comment]checked for malware[/comment]</curation>
  <creator>Yannic Kilcher</creator>
  <!-- The description holds HTML markup stored as entity-escaped text, not as
       child elements; a consumer has to unescape it once to recover the markup. -->
  <description>&lt;div&gt;&lt;div&gt;GPT-4chan is a language model fine-tuned from &lt;a href="https://huggingface.co/EleutherAI/gpt-j-6B" rel="nofollow"&gt;GPT-J 6B&lt;/a&gt; on 3.5 years worth of data from 4chan's politically incorrect (/pol/) board, as included in the dataset &lt;span style="border-style:solid;border-color:rgb(229,231,235);"&gt;&lt;a href="https://zenodo.org/record/3606810" rel="nofollow"&gt;Raiders of the Lost Kek: 3.5 Years of Augmented 4chan Posts from the Politically Incorrect Board&lt;/a&gt;&lt;/span&gt;.&lt;/div&gt;&lt;/div&gt;</description>
  <publisher>Yannic Kilcher</publisher>
  <language>English</language>
  <collection>datasets</collection>
</metadata>