File size: 4,452 Bytes
85bcb47
1cb8f7f
85bcb47
1cb8f7f
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
85bcb47
 
63c5240
1cb8f7f
 
 
 
 
 
 
 
 
 
 
 
 
 
63c5240
1cb8f7f
 
 
 
 
 
 
 
 
5852be1
1cb8f7f
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
63c5240
1cb8f7f
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
63c5240
1cb8f7f
 
bf1e8f3
1cb8f7f
 
 
 
 
 
 
89f340d
1cb8f7f
 
 
 
 
 
 
 
 
 
 
 
89f340d
85bcb47
94b76d5
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
<!DOCTYPE html>
<html lang="en">
<head>
  <!-- Document language is declared on <html> so assistive technology and
       translation tools treat the page content as English. -->
  <meta charset="utf-8">
  <meta name="viewport" content="width=device-width, initial-scale=1">
  <title>DeepSeek Research Papers</title>
  <meta name="description"
        content="A collection of research papers from DeepSeek.">
  <meta name="keywords" content="DeepSeek, AI Research, Machine Learning">

  <!-- Web fonts -->
  <link href="https://fonts.googleapis.com/css?family=Google+Sans|Noto+Sans|Castoro"
        rel="stylesheet">

  <!-- Stylesheets: locally hosted Bulma and Font Awesome, Academicons from CDN,
       then the page's own index.css last. -->
  <link rel="stylesheet" href="./static/css/bulma.min.css">
  <link rel="stylesheet" href="./static/css/bulma-carousel.min.css">
  <link rel="stylesheet" href="./static/css/bulma-slider.min.css">
  <link rel="stylesheet" href="./static/css/fontawesome.all.min.css">
  <link rel="stylesheet"
        href="https://cdn.jsdelivr.net/gh/jpswalsh/academicons@1/css/academicons.min.css">
  <link rel="stylesheet" href="./static/css/index.css">
  <link rel="icon" href="./static/images/favicon.svg">

  <!-- All scripts are deferred so they do not block HTML parsing. Deferred
       scripts still execute in document order, so jQuery is loaded before the
       Bulma plugins and index.js.
       NOTE(review): assumes index.js does not rely on document.write or on
       running before the DOM is parsed; confirm against static/js/index.js. -->
  <script defer src="https://ajax.googleapis.com/ajax/libs/jquery/3.5.1/jquery.min.js"></script>
  <script defer src="./static/js/fontawesome.all.min.js"></script>
  <script defer src="./static/js/bulma-carousel.min.js"></script>
  <script defer src="./static/js/bulma-slider.min.js"></script>
  <script defer src="./static/js/index.js"></script>
</head>
<body>

<!-- Page banner: main title and the author line. -->
<section class="hero">
  <div class="hero-body">
    <div class="container is-max-desktop">
      <div class="columns is-centered">
        <div class="column has-text-centered">
          <h1 class="title is-1 publication-title">
            DeepSeek Research Papers
          </h1>
          <div class="is-size-5 publication-authors">
            <span class="author-block">DeepSeek Research Team</span>
          </div>
        </div>
      </div>
    </div>
  </div>
</section>

<!-- Tagline displayed beneath the banner. -->
<section class="hero teaser">
  <div class="container is-max-desktop">
    <div class="hero-body">
      <h2 class="subtitle has-text-centered">Advancing AI through Open Research and Innovation</h2>
    </div>
  </div>
</section>

<!-- Publications: one "paper-item" box per paper, each with a title, a
     one-line summary, a link to the paper, and its date. -->
<section class="section">
  <div class="container is-max-desktop">
    <div class="columns is-centered">
      <div class="column is-full-width">
        <h2 class="title is-3 has-text-centered">Publications</h2>

        <!-- Paper List Start -->
        <!-- Conventions for every entry:
             - Links open in a new tab, so they carry rel="noopener noreferrer"
               to keep the target page from reaching window.opener.
             - Each link gets an aria-label naming its paper, because the
               visible text "Paper" is identical across entries.
             - Icons are decorative and hidden from assistive technology.
             NOTE(review): the braces around each date render literally; they
             look like leftover template placeholders. Confirm intent. -->
        <div class="content">
          <!-- Paper 1 -->
          <div class="paper-item box">
            <h3 class="title is-4">1. DeepSeek LLM: Scaling Open-Source Language Models with Longtermism</h3>
            <p>Scaling open-source language models with a focus on longtermism.</p>
            <div class="publication-links">
              <span class="link-block">
                <a href="https://huggingface.co/papers/2401.02954" target="_blank"
                   rel="noopener noreferrer"
                   class="external-link button is-normal is-rounded is-dark"
                   aria-label="Paper: DeepSeek LLM: Scaling Open-Source Language Models with Longtermism (opens in a new tab)">
                  <span class="icon">
                      <i class="fas fa-file-pdf" aria-hidden="true"></i>
                  </span>
                  <span>Paper</span>
                </a>
              </span>
              <span class="is-size-6 has-text-grey">{Jan 6, 2024}</span>
            </div>
          </div>

          <!-- Paper 2 -->
          <div class="paper-item box">
            <h3 class="title is-4">2. DeepSeekMoE: Towards Ultimate Expert Specialization in Mixture-of-Experts Language Models</h3>
            <p>Exploring expert specialization in Mixture-of-Experts language models.</p>
            <div class="publication-links">
              <span class="link-block">
                <a href="https://arxiv.org/abs/2401.06066" target="_blank"
                   rel="noopener noreferrer"
                   class="external-link button is-normal is-rounded is-dark"
                   aria-label="Paper: DeepSeekMoE: Towards Ultimate Expert Specialization in Mixture-of-Experts Language Models (opens in a new tab)">
                  <span class="icon">
                      <i class="fas fa-file-pdf" aria-hidden="true"></i>
                  </span>
                  <span>Paper</span>
                </a>
              </span>
              <span class="is-size-6 has-text-grey">{Jan 11, 2024}</span>
            </div>
          </div>

          <!-- Remaining papers follow the same structure -->
          <!-- Paper 3 to 17 would be added here with the same pattern -->

        </div>
        <!-- Paper List End -->

      </div>
    </div>
  </div>
</section>

<!-- Site footer: copyright notice and framework credit. -->
<footer class="footer">
  <div class="container">
    <div class="content has-text-centered">
      <p>© 2024 DeepSeek. All rights reserved.</p>
      <p>This website is built using the Bulma CSS framework.</p>
    </div>
  </div>
</footer>

</body>
</html>