metacritical committed on
Commit
1cb8f7f
·
verified ·
1 Parent(s): ecc40f6
Files changed (1) hide show
  1. index.html +111 -66
index.html CHANGED
@@ -1,80 +1,125 @@
1
  <!DOCTYPE html>
2
- <html lang="en">
3
  <head>
4
- <meta charset="UTF-8">
5
- <meta name="viewport" content="width=device-width, initial-scale=1.0">
6
- <title>DeepSeek Papers</title>
7
- <link rel="stylesheet" href="styles.css">
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
8
  </head>
9
  <body>
10
- <header>
11
- <h1>DeepSeek Papers</h1>
12
- </header>
13
-
14
- <main>
15
- <section>
16
- <h2>DeepSeek Papers</h2>
17
 
18
- <article>
19
- <h3>1. <strong>DeepSeek LLM: Scaling Open-Source Language Models with Longtermism</strong></h3>
20
- <p>Description: Scaling open-source language models with a focus on longtermism.</p>
21
- <ul>
22
- <li><a href="https://huggingface.co/papers/2401.02954">Link to Paper</a> {Jan 6, 2024}</li>
23
- </ul>
24
- </article>
 
 
 
 
 
 
 
25
 
26
- <article>
27
- <h3>2. <strong>DeepSeekMoE: Towards Ultimate Expert Specialization in Mixture-of-Experts Language Models</strong></h3>
28
- <p>Description: Exploring expert specialization in Mixture-of-Experts language models.</p>
29
- <ul>
30
- <li><a href="https://arxiv.org/abs/2401.06066">Link to Paper</a> {Jan 11, 2024}</li>
31
- </ul>
32
- </article>
 
 
33
 
34
- <article>
35
- <h3>3. <strong>DeepSeek-Coder: When the Large Language Model Meets Programming -- The Rise of Code Intelligence</strong></h3>
36
- <p>Description: Investigating the intersection of large language models and programming.</p>
37
- <ul>
38
- <li><a href="https://arxiv.org/abs/2401.14196">Link to Paper</a> {Jan 25, 2024}</li>
39
- </ul>
40
- </article>
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
41
 
42
- <!-- Repeat for the remaining papers -->
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
43
 
44
- <article>
45
- <h3>17. <strong>Native Sparse Attention: Hardware-Aligned and Natively Trainable Sparse Attention</strong></h3>
46
- <p>Description: Hardware-Aligned and Natively Trainable Sparse Attention.</p>
47
- <ul>
48
- <li><a href="https://arxiv.org/abs/2502.11089">Link to Paper</a> {Feb 16, 2025}</li>
49
- </ul>
50
- </article>
51
- </section>
52
 
53
- <section>
54
- <h2>Related Links</h2>
55
- <p>There's a lot of excellent work being done in the field of AI and machine learning. For more information, check out these resources:</p>
56
- <ul>
57
- <li><a href="https://huggingface.co/papers">Hugging Face Papers</a></li>
58
- <li><a href="https://arxiv.org">arXiv.org</a></li>
59
- </ul>
60
- </section>
61
 
62
- <section>
63
- <h2>BibTeX</h2>
64
- <pre><code class="bibtex">
65
- @article{deepseek2024papers,
66
- author = {DeepSeek Research Team},
67
- title = {DeepSeek Papers: Advancements in Language Models and Multimodal Understanding},
68
- journal = {DeepSeek Publications},
69
- year = {2024-2025},
70
- }
71
- </code></pre>
72
- </section>
73
- </main>
74
 
75
- <footer>
76
- <p>This website is licensed under a <a href="https://creativecommons.org/licenses/by-sa/4.0/">Creative Commons Attribution-ShareAlike 4.0 International License</a>.</p>
77
- <p>This means you are free to borrow the <a href="source-code-link">source code</a> of this website; we just ask that you link back to this page in the footer. Please remember to remove the analytics code included in the header of the website which you do not want on your website.</p>
78
- </footer>
79
  </body>
80
  </html>
 
1
  <!DOCTYPE html>
2
+ <html lang="en">
3
  <head>
4
+ <meta charset="utf-8">
5
+ <meta name="description"
6
+ content="A collection of research papers from DeepSeek.">
7
+ <meta name="keywords" content="DeepSeek, AI Research, Machine Learning">
8
+ <meta name="viewport" content="width=device-width, initial-scale=1">
9
+ <title>DeepSeek Research Papers</title>
10
+
11
+ <link href="https://fonts.googleapis.com/css?family=Google+Sans|Noto+Sans|Castoro"
12
+ rel="stylesheet">
13
+
14
+ <link rel="stylesheet" href="./static/css/bulma.min.css">
15
+ <link rel="stylesheet" href="./static/css/bulma-carousel.min.css">
16
+ <link rel="stylesheet" href="./static/css/bulma-slider.min.css">
17
+ <link rel="stylesheet" href="./static/css/fontawesome.all.min.css">
18
+ <link rel="stylesheet"
19
+ href="https://cdn.jsdelivr.net/gh/jpswalsh/academicons@1/css/academicons.min.css">
20
+ <link rel="stylesheet" href="./static/css/index.css">
21
+ <link rel="icon" href="./static/images/favicon.svg">
22
+
23
+ <script src="https://ajax.googleapis.com/ajax/libs/jquery/3.5.1/jquery.min.js"></script>
24
+ <script defer src="./static/js/fontawesome.all.min.js"></script>
25
+ <script src="./static/js/bulma-carousel.min.js"></script>
26
+ <script src="./static/js/bulma-slider.min.js"></script>
27
+ <script src="./static/js/index.js"></script>
28
  </head>
29
  <body>
 
 
 
 
 
 
 
30
 
31
+ <section class="hero">
32
+ <div class="hero-body">
33
+ <div class="container is-max-desktop">
34
+ <div class="columns is-centered">
35
+ <div class="column has-text-centered">
36
+ <h1 class="title is-1 publication-title">DeepSeek Research Papers</h1>
37
+ <div class="is-size-5 publication-authors">
38
+ <span class="author-block">DeepSeek Research Team</span>
39
+ </div>
40
+ </div>
41
+ </div>
42
+ </div>
43
+ </div>
44
+ </section>
45
 
46
+ <section class="hero teaser">
47
+ <div class="container is-max-desktop">
48
+ <div class="hero-body">
49
+ <h2 class="subtitle has-text-centered">
50
+ Advancing AI through Open Research and Innovation
51
+ </h2>
52
+ </div>
53
+ </div>
54
+ </section>
55
 
56
+ <section class="section">
57
+ <div class="container is-max-desktop">
58
+ <div class="columns is-centered">
59
+ <div class="column is-full-width">
60
+ <h2 class="title is-3 has-text-centered">Publications</h2>
61
+
62
+ <!-- Paper List Start -->
63
+ <div class="content">
64
+ <!-- Paper 1 -->
65
+ <div class="paper-item box">
66
+ <h3 class="title is-4">1. DeepSeek LLM: Scaling Open-Source Language Models with Longtermism</h3>
67
+ <p>Scaling open-source language models with a focus on longtermism.</p>
68
+ <div class="publication-links">
69
+ <span class="link-block">
70
+ <a href="https://huggingface.co/papers/2401.02954" target="_blank"
71
+ class="external-link button is-normal is-rounded is-dark">
72
+ <span class="icon">
73
+ <i class="fas fa-file-pdf"></i>
74
+ </span>
75
+ <span>Paper</span>
76
+ </a>
77
+ </span>
78
+ <span class="is-size-6 has-text-grey">{Jan 6, 2024}</span>
79
+ </div>
80
+ </div>
81
 
82
+ <!-- Paper 2 -->
83
+ <div class="paper-item box">
84
+ <h3 class="title is-4">2. DeepSeekMoE: Towards Ultimate Expert Specialization in Mixture-of-Experts Language Models</h3>
85
+ <p>Exploring expert specialization in Mixture-of-Experts language models.</p>
86
+ <div class="publication-links">
87
+ <span class="link-block">
88
+ <a href="https://arxiv.org/abs/2401.06066" target="_blank"
89
+ class="external-link button is-normal is-rounded is-dark">
90
+ <span class="icon">
91
+ <i class="fas fa-file-pdf"></i>
92
+ </span>
93
+ <span>Paper</span>
94
+ </a>
95
+ </span>
96
+ <span class="is-size-6 has-text-grey">{Jan 11, 2024}</span>
97
+ </div>
98
+ </div>
99
 
100
+ <!-- Remaining papers follow the same structure -->
101
+ <!-- Papers 3 through 17 are to be added here, following the same pattern -->
 
 
 
 
 
 
102
 
103
+ </div>
104
+ <!-- Paper List End -->
105
+
106
+ </div>
107
+ </div>
108
+ </div>
109
+ </section>
 
110
 
111
+ <footer class="footer">
112
+ <div class="container">
113
+ <div class="content has-text-centered">
114
+ <p>
115
+ © 2024 DeepSeek. All rights reserved.
116
+ </p>
117
+ <p>
118
+ This website is built using the Bulma CSS framework.
119
+ </p>
120
+ </div>
121
+ </div>
122
+ </footer>
123
 
 
 
 
 
124
  </body>
125
  </html>