Spaces:
Running
Running
Check
Browse files- index.html +111 -66
index.html
CHANGED
@@ -1,80 +1,125 @@
|
|
1 |
<!DOCTYPE html>
|
2 |
-
<html
|
3 |
<head>
|
4 |
-
<meta charset="
|
5 |
-
<meta name="
|
6 |
-
|
7 |
-
<
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
8 |
</head>
|
9 |
<body>
|
10 |
-
<header>
|
11 |
-
<h1>DeepSeek Papers</h1>
|
12 |
-
</header>
|
13 |
-
|
14 |
-
<main>
|
15 |
-
<section>
|
16 |
-
<h2>DeepSeek Papers</h2>
|
17 |
|
18 |
-
|
19 |
-
|
20 |
-
|
21 |
-
|
22 |
-
|
23 |
-
|
24 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
25 |
|
26 |
-
|
27 |
-
|
28 |
-
|
29 |
-
|
30 |
-
|
31 |
-
|
32 |
-
|
|
|
|
|
33 |
|
34 |
-
|
35 |
-
|
36 |
-
|
37 |
-
|
38 |
-
|
39 |
-
|
40 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
41 |
|
42 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
43 |
|
44 |
-
|
45 |
-
|
46 |
-
<p>Description: Hardware-Aligned and Natively Trainable Sparse Attention.</p>
|
47 |
-
<ul>
|
48 |
-
<li><a href="https://arxiv.org/abs/2502.11089">Link to Paper</a> {Feb 16, 2025}</li>
|
49 |
-
</ul>
|
50 |
-
</article>
|
51 |
-
</section>
|
52 |
|
53 |
-
|
54 |
-
|
55 |
-
|
56 |
-
|
57 |
-
|
58 |
-
|
59 |
-
|
60 |
-
</section>
|
61 |
|
62 |
-
|
63 |
-
|
64 |
-
|
65 |
-
|
66 |
-
|
67 |
-
|
68 |
-
|
69 |
-
|
70 |
-
|
71 |
-
|
72 |
-
|
73 |
-
|
74 |
|
75 |
-
<footer>
|
76 |
-
<p>This website is licensed under a <a href="https://creativecommons.org/licenses/by-sa/4.0/">Creative Commons Attribution-ShareAlike 4.0 International License</a>.</p>
|
77 |
-
<p>This means you are free to borrow the <a href="source-code-link">source code</a> of this website; we just ask that you link back to this page in the footer. Please remember to remove the analytics code included in the header of the website which you do not want on your website.</p>
|
78 |
-
</footer>
|
79 |
</body>
|
80 |
</html>
|
|
|
1 |
<!DOCTYPE html>
|
2 |
+
<html lang="en">
|
3 |
<head>
|
4 |
+
<meta charset="utf-8">
|
5 |
+
<meta name="description"
|
6 |
+
content="A collection of research papers from DeepSeek.">
|
7 |
+
<meta name="keywords" content="DeepSeek, AI Research, Machine Learning">
|
8 |
+
<meta name="viewport" content="width=device-width, initial-scale=1">
|
9 |
+
<title>DeepSeek Research Papers</title>
|
10 |
+
|
11 |
+
<link href="https://fonts.googleapis.com/css?family=Google+Sans%7CNoto+Sans%7CCastoro"
|
12 |
+
rel="stylesheet">
|
13 |
+
|
14 |
+
<link rel="stylesheet" href="./static/css/bulma.min.css">
|
15 |
+
<link rel="stylesheet" href="./static/css/bulma-carousel.min.css">
|
16 |
+
<link rel="stylesheet" href="./static/css/bulma-slider.min.css">
|
17 |
+
<link rel="stylesheet" href="./static/css/fontawesome.all.min.css">
|
18 |
+
<link rel="stylesheet"
|
19 |
+
href="https://cdn.jsdelivr.net/gh/jpswalsh/academicons@1/css/academicons.min.css">
|
20 |
+
<link rel="stylesheet" href="./static/css/index.css">
|
21 |
+
<link rel="icon" href="./static/images/favicon.svg">
|
22 |
+
|
23 |
+
<script src="https://ajax.googleapis.com/ajax/libs/jquery/3.5.1/jquery.min.js"></script>
|
24 |
+
<script defer src="./static/js/fontawesome.all.min.js"></script>
|
25 |
+
<script src="./static/js/bulma-carousel.min.js"></script>
|
26 |
+
<script src="./static/js/bulma-slider.min.js"></script>
|
27 |
+
<script src="./static/js/index.js"></script>
|
28 |
</head>
|
29 |
<body>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
30 |
|
31 |
+
<section class="hero">
|
32 |
+
<div class="hero-body">
|
33 |
+
<div class="container is-max-desktop">
|
34 |
+
<div class="columns is-centered">
|
35 |
+
<div class="column has-text-centered">
|
36 |
+
<h1 class="title is-1 publication-title">DeepSeek Research Papers</h1>
|
37 |
+
<div class="is-size-5 publication-authors">
|
38 |
+
<span class="author-block">DeepSeek Research Team</span>
|
39 |
+
</div>
|
40 |
+
</div>
|
41 |
+
</div>
|
42 |
+
</div>
|
43 |
+
</div>
|
44 |
+
</section>
|
45 |
|
46 |
+
<section class="hero teaser">
|
47 |
+
<div class="container is-max-desktop">
|
48 |
+
<div class="hero-body">
|
49 |
+
<h2 class="subtitle has-text-centered">
|
50 |
+
Advancing AI through Open Research and Innovation
|
51 |
+
</h2>
|
52 |
+
</div>
|
53 |
+
</div>
|
54 |
+
</section>
|
55 |
|
56 |
+
<section class="section">
|
57 |
+
<div class="container is-max-desktop">
|
58 |
+
<div class="columns is-centered">
|
59 |
+
<div class="column is-full-width">
|
60 |
+
<h2 class="title is-3 has-text-centered">Publications</h2>
|
61 |
+
|
62 |
+
<!-- Paper List Start -->
|
63 |
+
<div class="content">
|
64 |
+
<!-- Paper 1 -->
|
65 |
+
<div class="paper-item box">
|
66 |
+
<h3 class="title is-4">1. DeepSeek LLM: Scaling Open-Source Language Models with Longtermism</h3>
|
67 |
+
<p>Scaling open-source language models with a focus on longtermism.</p>
|
68 |
+
<div class="publication-links">
|
69 |
+
<span class="link-block">
|
70 |
+
<a href="https://huggingface.co/papers/2401.02954" target="_blank" rel="noopener noreferrer"
|
71 |
+
class="external-link button is-normal is-rounded is-dark">
|
72 |
+
<span class="icon">
|
73 |
+
<i class="fas fa-file-pdf" aria-hidden="true"></i>
|
74 |
+
</span>
|
75 |
+
<span>Paper</span>
|
76 |
+
</a>
|
77 |
+
</span>
|
78 |
+
<span class="is-size-6 has-text-grey">{Jan 6, 2024}</span>
|
79 |
+
</div>
|
80 |
+
</div>
|
81 |
|
82 |
+
<!-- Paper 2 -->
|
83 |
+
<div class="paper-item box">
|
84 |
+
<h3 class="title is-4">2. DeepSeekMoE: Towards Ultimate Expert Specialization in Mixture-of-Experts Language Models</h3>
|
85 |
+
<p>Exploring expert specialization in Mixture-of-Experts language models.</p>
|
86 |
+
<div class="publication-links">
|
87 |
+
<span class="link-block">
|
88 |
+
<a href="https://arxiv.org/abs/2401.06066" target="_blank" rel="noopener noreferrer"
|
89 |
+
class="external-link button is-normal is-rounded is-dark">
|
90 |
+
<span class="icon">
|
91 |
+
<i class="fas fa-file-pdf" aria-hidden="true"></i>
|
92 |
+
</span>
|
93 |
+
<span>Paper</span>
|
94 |
+
</a>
|
95 |
+
</span>
|
96 |
+
<span class="is-size-6 has-text-grey">{Jan 11, 2024}</span>
|
97 |
+
</div>
|
98 |
+
</div>
|
99 |
|
100 |
+
<!-- Remaining papers follow the same structure -->
|
101 |
+
<!-- Paper 3 to 17 would be added here with the same pattern -->
|
|
|
|
|
|
|
|
|
|
|
|
|
102 |
|
103 |
+
</div>
|
104 |
+
<!-- Paper List End -->
|
105 |
+
|
106 |
+
</div>
|
107 |
+
</div>
|
108 |
+
</div>
|
109 |
+
</section>
|
|
|
110 |
|
111 |
+
<footer class="footer">
|
112 |
+
<div class="container">
|
113 |
+
<div class="content has-text-centered">
|
114 |
+
<p>
|
115 |
+
© 2024 DeepSeek. All rights reserved.
|
116 |
+
</p>
|
117 |
+
<p>
|
118 |
+
This website is built using the Bulma CSS framework.
|
119 |
+
</p>
|
120 |
+
</div>
|
121 |
+
</div>
|
122 |
+
</footer>
|
123 |
|
|
|
|
|
|
|
|
|
124 |
</body>
|
125 |
</html>
|