-
Notifications
You must be signed in to change notification settings - Fork 1
/
index.html
40 lines (40 loc) · 13.5 KB
/
index.html
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
<!DOCTYPE html>
<!--
  Standalone Markmap page. The head defines a full-viewport <svg id="mindmap">
  canvas and pulls in the toolbar stylesheet; the scripts further down in the
  body render the mind map into that <svg>.
-->
<!--
  lang: the hand-written category labels in the map are Korean, mixed with
  English paper names. NOTE(review): "ko" is a judgement call. Switch to "en"
  if the page is meant primarily for English readers.
-->
<html lang="ko">
<head>
  <meta charset="UTF-8">
  <meta name="viewport" content="width=device-width, initial-scale=1.0">
  <meta http-equiv="X-UA-Compatible" content="ie=edge">
  <title>Markmap</title>
  <style>
    /* Reset default spacing on every element so the canvas can sit flush
       against the viewport edges. */
    * {
      margin: 0;
      padding: 0;
    }

    /* The mind-map canvas occupies the whole viewport. */
    #mindmap {
      display: block;
      width: 100vw;
      height: 100vh;
    }
  </style>
  <!-- Styles for the toolbar; same pinned version as the toolbar script loaded in the body. -->
  <link rel="stylesheet" href="https://cdn.jsdelivr.net/npm/markmap-toolbar@0.15.3/dist/style.css">
</head>
<body>
<!-- Render target: the inline script below selects it as 'svg#mindmap'. -->
<svg id="mindmap"></svg>
<!--
  Version-pinned libraries from jsDelivr, loaded synchronously in document
  order. The inline scripts below read window.markmap (Markmap, Toolbar,
  deriveOptions), which is expected to be defined by these bundles.
-->
<script src="https://cdn.jsdelivr.net/npm/d3@7.8.5/dist/d3.min.js"></script>
<script src="https://cdn.jsdelivr.net/npm/markmap-view@0.15.3/dist/browser/index.js"></script>
<script src="https://cdn.jsdelivr.net/npm/markmap-toolbar@0.15.3/dist/index.js"></script>
<script>
// Toolbar setup.
// Scheduled through a zero-delay timer instead of running inline: the callback
// reads window.mm, which is only assigned by the next inline script, so the
// work is pushed to a later task to let that script run first.
setTimeout(() => {
  const { markmap, mm } = window;
  // Build the toolbar for the existing Markmap instance and pin it to the
  // bottom-right corner of the page.
  const { el } = markmap.Toolbar.create(mm);
  el.setAttribute('style', 'position:absolute;bottom:20px;right:20px');
  document.body.append(el);
});
</script>
<script>
// Mind-map rendering.
// Arguments of the immediately-invoked function, in order:
//   getMarkmap   - returns the markmap namespace (window.markmap)
//   getOptions   - optional options factory; null here, so
//                  markmap.deriveOptions is used instead
//   root         - the tree to draw (nested nodes with type / depth /
//                  payload.lines / content / children)
//   jsonOptions  - plain options object handed to the options factory
// The created instance is published as window.mm for the toolbar script above.
//
// Every string literal in the tree is kept on a single line: a raw line break
// inside a quoted JavaScript string is a syntax error and would stop the whole
// script from running.
//
// NOTE(review): node labels are reproduced verbatim, including the
// misspellings "Instruction-follwing", "Reinformcement" and "Effficient".
// The node types (heading / list_item) suggest the tree was generated from a
// Markdown outline, so presumably those should be corrected there. Confirm.
((getMarkmap, getOptions, root, jsonOptions) => {
  const markmap = getMarkmap();
  window.mm = markmap.Markmap.create(
    'svg#mindmap',
    (getOptions || markmap.deriveOptions)(jsonOptions),
    root
  );
})(
  () => window.markmap,
  null,
  {"type":"heading","depth":0,"payload":{"lines":[0,1]},"content":"NLP","children":[
    {"type":"heading","depth":1,"payload":{"lines":[2,3]},"content":"<a href=\"https://arxiv.org/abs/1409.0473\">Bahdanau attention</a>","children":[]},
    {"type":"heading","depth":1,"payload":{"lines":[4,5]},"content":"<a href=\"https://arxiv.org/abs/1508.04025\">Luong attention</a>","children":[]},
    {"type":"heading","depth":1,"payload":{"lines":[6,7]},"content":"<a href=\"https://arxiv.org/abs/1608.05859\">Weight tying</a>","children":[]},
    {"type":"heading","depth":1,"payload":{"lines":[8,9]},"content":"<a href=\"https://arxiv.org/abs/1706.03762\">Transformer</a>","children":[
      {"type":"heading","depth":2,"payload":{"lines":[10,11]},"content":"Encoder-Only <a href=\"https://arxiv.org/abs/1810.04805\">BERT</a>","children":[
        {"type":"list_item","depth":3,"payload":{"lines":[11,12]},"content":"성능 향상","children":[
          {"type":"list_item","depth":4,"payload":{"lines":[12,13]},"content":"<a href=\"https://arxiv.org/abs/1907.11692\">RoBERTa</a>","children":[]},
          {"type":"list_item","depth":4,"payload":{"lines":[13,14]},"content":"<a href=\"https://arxiv.org/abs/2007.14062\">Big Bird</a>","children":[]},
          {"type":"list_item","depth":4,"payload":{"lines":[14,15]},"content":"<a href=\"https://arxiv.org/abs/1906.08237\">XLNet</a>","children":[]},
          {"type":"list_item","depth":4,"payload":{"lines":[15,16]},"content":"<a href=\"https://arxiv.org/abs/2003.10555\">ELECTRA</a>","children":[]},
          {"type":"list_item","depth":4,"payload":{"lines":[16,17]},"content":"<a href=\"https://arxiv.org/abs/1907.10529\">SpanBERT</a>","children":[]}
        ]},
        {"type":"list_item","depth":3,"payload":{"lines":[18,19]},"content":"domain 적용","children":[
          {"type":"list_item","depth":4,"payload":{"lines":[19,20]},"content":"<a href=\"https://arxiv.org/abs/1901.08746\">BioBERT</a>","children":[]},
          {"type":"list_item","depth":4,"payload":{"lines":[20,21]},"content":"<a href=\"https://arxiv.org/abs/2103.04475\">LogBERT</a>","children":[]},
          {"type":"list_item","depth":4,"payload":{"lines":[21,22]},"content":"<a href=\"https://arxiv.org/abs/1904.05342\">ClinicalBERT</a>","children":[]}
        ]},
        {"type":"list_item","depth":3,"payload":{"lines":[23,24]},"content":"경량화","children":[
          {"type":"list_item","depth":4,"payload":{"lines":[24,25]},"content":"<a href=\"https://arxiv.org/abs/1910.01108\">DistilBERT</a>","children":[]},
          {"type":"list_item","depth":4,"payload":{"lines":[25,26]},"content":"<a href=\"https://arxiv.org/abs/1909.11942\">ALBERT</a>","children":[]}
        ]}
      ]},
      {"type":"heading","depth":2,"payload":{"lines":[28,29]},"content":"Decoder-Only <a href=\"https://openai.com/research/language-unsupervised\">GPT-1</a>","children":[
        {"type":"list_item","depth":3,"payload":{"lines":[29,30]},"content":"<a href=\"https://d4mucfpksywv.cloudfront.net/better-language-models/language-models.pdf\">GPT-2</a>","children":[
          {"type":"list_item","depth":4,"payload":{"lines":[30,31]},"content":"<a href=\"https://arxiv.org/abs/2005.14165\">GPT-3</a>","children":[
            {"type":"list_item","depth":5,"payload":{"lines":[31,32]},"content":"Self-Instruction","children":[
              {"type":"list_item","depth":6,"payload":{"lines":[32,33]},"content":"<a href=\"https://arxiv.org/abs/2212.10560\">Self-Instruct</a>","children":[]}
            ]},
            {"type":"list_item","depth":5,"payload":{"lines":[33,34]},"content":"Open Access","children":[
              {"type":"list_item","depth":6,"payload":{"lines":[34,35]},"content":"<a href=\"https://arxiv.org/abs/2302.13971\">LLAMA</a>","children":[
                {"type":"list_item","depth":7,"payload":{"lines":[35,36]},"content":"Instruction-follwing","children":[
                  {"type":"list_item","depth":8,"payload":{"lines":[36,37]},"content":"<a href=\"https://crfm.stanford.edu/2023/03/13/alpaca.html\">Alpaca</a>","children":[]},
                  {"type":"list_item","depth":8,"payload":{"lines":[37,38]},"content":"<a href=\"https://arxiv.org/abs/2305.11206\">LIMA</a>","children":[]}
                ]}
              ]},
              {"type":"list_item","depth":6,"payload":{"lines":[38,39]},"content":"<a href=\"https://arxiv.org/abs/2211.05100\">BLOOM</a>","children":[
                {"type":"list_item","depth":7,"payload":{"lines":[39,40]},"content":"<a href=\"https://arxiv.org/abs/2211.01786\">BLOOMZ</a>","children":[]}
              ]}
            ]},
            {"type":"list_item","depth":5,"payload":{"lines":[40,41]},"content":"RLHF (Reinformcement Learning Human Feedback)","children":[
              {"type":"list_item","depth":6,"payload":{"lines":[41,42]},"content":"<a href=\"https://arxiv.org/abs/2203.02155\">InstructGPT</a>","children":[
                {"type":"list_item","depth":7,"payload":{"lines":[42,43]},"content":"<a href=\"https://arxiv.org/abs/2303.08774\">GPT-4</a>","children":[]}
              ]}
            ]},
            {"type":"list_item","depth":5,"payload":{"lines":[43,44]},"content":"<a href=\"https://arxiv.org/abs/2204.02311\">PALM</a>","children":[
              {"type":"list_item","depth":6,"payload":{"lines":[44,45]},"content":"<a href=\"https://ai.google/static/documents/palm2techreport.pdf\">PALM2</a>","children":[]},
              {"type":"list_item","depth":6,"payload":{"lines":[45,46]},"content":"<a href=\"https://arxiv.org/abs/2210.11416\">Flan-PALM</a>","children":[]}
            ]}
          ]}
        ]}
      ]},
      {"type":"heading","depth":2,"payload":{"lines":[47,48]},"content":"Encoder-Decoder <a href=\"https://arxiv.org/abs/1910.13461\">BART</a>","children":[
        {"type":"list_item","depth":3,"payload":{"lines":[48,49]},"content":"성능 향상","children":[
          {"type":"list_item","depth":4,"payload":{"lines":[49,50]},"content":"<a href=\"https://arxiv.org/abs/1910.10683\">T5</a>","children":[
            {"type":"list_item","depth":5,"payload":{"lines":[50,51]},"content":"<a href=\"https://arxiv.org/abs/2210.11416\">FLAN-T5</a>","children":[]},
            {"type":"list_item","depth":5,"payload":{"lines":[51,52]},"content":"<a href=\"https://arxiv.org/abs/2110.08207\">T0</a>","children":[]}
          ]}
        ]},
        {"type":"list_item","depth":3,"payload":{"lines":[52,53]},"content":"multimodal","children":[
          {"type":"list_item","depth":4,"payload":{"lines":[53,54]},"content":"<a href=\"https://arxiv.org/abs/2206.06336\">METALM</a>","children":[
            {"type":"list_item","depth":5,"payload":{"lines":[54,55]},"content":"<a href=\"https://arxiv.org/abs/2302.14045\">KOSMOS-1</a>","children":[]}
          ]},
          {"type":"list_item","depth":4,"payload":{"lines":[55,56]},"content":"<a href=\"https://arxiv.org/abs/2204.14198\">Flamingo</a>","children":[]}
        ]}
      ]},
      {"type":"heading","depth":2,"payload":{"lines":[58,59]},"content":"Transformer 구조 수정","children":[
        {"type":"list_item","depth":3,"payload":{"lines":[59,60]},"content":"Layernorm + initialization","children":[
          {"type":"list_item","depth":4,"payload":{"lines":[60,61]},"content":"<a href=\"https://arxiv.org/abs/2203.00555\">DeepNet</a>","children":[]},
          {"type":"list_item","depth":4,"payload":{"lines":[61,62]},"content":"<a href=\"https://arxiv.org/abs/2210.06423\">MAGNETO</a>","children":[]}
        ]},
        {"type":"list_item","depth":3,"payload":{"lines":[62,63]},"content":"Self-attention 관련","children":[
          {"type":"list_item","depth":4,"payload":{"lines":[63,64]},"content":"<a href=\"https://arxiv.org/abs/2001.04451\">Reformer</a>","children":[]},
          {"type":"list_item","depth":4,"payload":{"lines":[64,65]},"content":"<a href=\"https://arxiv.org/abs/1803.02155\">Relative positional encoding</a>","children":[]},
          {"type":"list_item","depth":4,"payload":{"lines":[65,66]},"content":"<a href=\"https://arxiv.org/abs/2004.05150\">Longformer</a>","children":[]},
          {"type":"list_item","depth":4,"payload":{"lines":[66,67]},"content":"<a href=\"https://arxiv.org/abs/2105.03824\">FNet</a>","children":[]}
        ]}
      ]},
      {"type":"heading","depth":2,"payload":{"lines":[68,69]},"content":"LM with External Knowledge","children":[
        {"type":"list_item","depth":3,"payload":{"lines":[69,70]},"content":"with Document","children":[
          {"type":"list_item","depth":4,"payload":{"lines":[70,71]},"content":"<a href=\"https://arxiv.org/abs/2004.04906\">DPR</a>","children":[
            {"type":"list_item","depth":5,"payload":{"lines":[71,72]},"content":"<a href=\"https://arxiv.org/abs/2112.09118\">Contriever</a>","children":[]},
            {"type":"list_item","depth":5,"payload":{"lines":[72,73]},"content":"<a href=\"https://arxiv.org/abs/2306.02516\">SamToNe</a>","children":[]}
          ]},
          {"type":"list_item","depth":4,"payload":{"lines":[73,74]},"content":"<a href=\"https://arxiv.org/abs/2108.13817\">ORQA</a>","children":[
            {"type":"list_item","depth":5,"payload":{"lines":[74,75]},"content":"<a href=\"https://arxiv.org/abs/2002.08909\">REALM</a>","children":[
              {"type":"list_item","depth":6,"payload":{"lines":[75,76]},"content":"Reader -> Generator <a href=\"https://arxiv.org/abs/2005.11401\">RAG</a>","children":[
                {"type":"list_item","depth":7,"payload":{"lines":[76,77]},"content":"<a href=\"https://arxiv.org/abs/2207.06300\">Re2G</a>","children":[]},
                {"type":"list_item","depth":7,"payload":{"lines":[77,78]},"content":"<a href=\"https://arxiv.org/abs/2007.01282\">FiD</a>","children":[]},
                {"type":"list_item","depth":7,"payload":{"lines":[78,79]},"content":"<a href=\"https://arxiv.org/abs/2208.03299\">Atlas</a>","children":[]},
                {"type":"list_item","depth":7,"payload":{"lines":[79,80]},"content":"<a href=\"https://arxiv.org/abs/2301.12652\">REPLUG</a>","children":[]},
                {"type":"list_item","depth":7,"payload":{"lines":[80,81]},"content":"<a href=\"https://arxiv.org/abs/2305.17080\">EAR</a>","children":[]}
              ]}
            ]}
          ]}
        ]},
        {"type":"list_item","depth":3,"payload":{"lines":[82,83]},"content":"with KG","children":[
          {"type":"list_item","depth":4,"payload":{"lines":[83,84]},"content":"<a href=\"https://arxiv.org/abs/2305.12416\">DiFaR</a>","children":[]},
          {"type":"list_item","depth":4,"payload":{"lines":[84,85]},"content":"<a href=\"https://aclanthology.org/2021.eacl-main.26/\">Retrieve-Rerank Framework</a>","children":[]}
        ]},
        {"type":"list_item","depth":3,"payload":{"lines":[86,87]},"content":"Document + KG","children":[
          {"type":"list_item","depth":4,"payload":{"lines":[87,88]},"content":"<a href=\"https://arxiv.org/abs/2012.14610\">UniK-QA</a>","children":[]}
        ]}
      ]}
    ]},
    {"type":"heading","depth":1,"payload":{"lines":[91,92]},"content":"Benchmark","children":[
      {"type":"heading","depth":2,"payload":{"lines":[92,93]},"content":"<a href=\"https://arxiv.org/abs/1804.07461\">GLUE</a>","children":[
        {"type":"list_item","depth":3,"payload":{"lines":[93,94]},"content":"<a href=\"https://arxiv.org/abs/1606.05250\">SQuAD</a>","children":[]},
        {"type":"list_item","depth":3,"payload":{"lines":[94,95]},"content":"<a href=\"https://arxiv.org/abs/1905.00537\">SuperGLUE</a>","children":[]}
      ]},
      {"type":"heading","depth":2,"payload":{"lines":[96,97]},"content":"<a href=\"https://arxiv.org/abs/1806.08730\">DecaNLP</a>","children":[]},
      {"type":"heading","depth":2,"payload":{"lines":[98,99]},"content":"<a href=\"https://arxiv.org/abs/2206.04615\">BIG-Bench</a>","children":[]},
      {"type":"heading","depth":2,"payload":{"lines":[100,101]},"content":"<a href=\"https://arxiv.org/abs/2204.07705\">SUPER-NATURALINSTRUCTIONS</a>","children":[]},
      {"type":"heading","depth":2,"payload":{"lines":[102,103]},"content":"<a href=\"https://arxiv.org/abs/2009.03300\">MMLU</a>","children":[]},
      {"type":"heading","depth":2,"payload":{"lines":[104,105]},"content":"Knowledge-Intensive Task","children":[
        {"type":"list_item","depth":3,"payload":{"lines":[105,106]},"content":"<a href=\"https://arxiv.org/abs/2009.02252\">KILT</a>","children":[
          {"type":"list_item","depth":4,"payload":{"lines":[106,107]},"content":"<a href=\"https://arxiv.org/abs/1803.05355\">FEVER</a>","children":[]}
        ]},
        {"type":"list_item","depth":3,"payload":{"lines":[107,108]},"content":"<a href=\"https://arxiv.org/abs/2104.08663\">BEIR</a>","children":[]}
      ]}
    ]},
    {"type":"heading","depth":1,"payload":{"lines":[110,111]},"content":"Effficient Training","children":[
      {"type":"list_item","depth":2,"payload":{"lines":[111,112]},"content":"<a href=\"https://arxiv.org/abs/1710.03740\">Mixed Precision</a>","children":[]},
      {"type":"list_item","depth":2,"payload":{"lines":[112,113]},"content":"Distributed learning","children":[
        {"type":"list_item","depth":3,"payload":{"lines":[113,114]},"content":"<a href=\"https://arxiv.org/abs/1909.08053\">Megatron-LM</a>","children":[]},
        {"type":"list_item","depth":3,"payload":{"lines":[114,115]},"content":"<a href=\"https://arxiv.org/abs/1910.02054\">Zero</a>","children":[
          {"type":"list_item","depth":4,"payload":{"lines":[115,116]},"content":"<a href=\"https://arxiv.org/abs/2104.07857\">Zero-Infinity</a>","children":[]}
        ]}
      ]},
      {"type":"list_item","depth":2,"payload":{"lines":[116,117]},"content":"<a href=\"https://arxiv.org/abs/2106.09685\">LoRA</a>","children":[]},
      {"type":"list_item","depth":2,"payload":{"lines":[117,118]},"content":"<a href=\"https://arxiv.org/abs/2104.08691\">Prompt Tuning</a>","children":[]}
    ]}
  ]},
  {"colorFreezeLevel":10,"maxWidth":800}
);
</script>
</body>
</html>