Compare commits
8 Commits
fbb3df94b2
...
main
| Author | SHA1 | Date | |
|---|---|---|---|
| 251afa8526 | |||
| e19f0bf0f1 | |||
| e5a591e03c | |||
| 4af1ed18a3 | |||
| 6d72e37eee | |||
| edd19df2a2 | |||
| 6f140c7845 | |||
| 22f5378e54 |
78
.github/workflows/hugo.yaml
vendored
78
.github/workflows/hugo.yaml
vendored
@@ -1,78 +0,0 @@
|
||||
# Sample workflow for building and deploying a Hugo site to GitHub Pages
|
||||
name: Deploy Hugo site to Pages
|
||||
|
||||
on:
|
||||
# Runs on pushes targeting the default branch
|
||||
push:
|
||||
branches:
|
||||
- main
|
||||
|
||||
# Allows you to run this workflow manually from the Actions tab
|
||||
workflow_dispatch:
|
||||
|
||||
# Sets permissions of the GITHUB_TOKEN to allow deployment to GitHub Pages
|
||||
permissions:
|
||||
contents: read
|
||||
pages: write
|
||||
id-token: write
|
||||
|
||||
# Allow only one concurrent deployment, skipping runs queued between the run in-progress and latest queued.
|
||||
# However, do NOT cancel in-progress runs as we want to allow these production deployments to complete.
|
||||
concurrency:
|
||||
group: "pages"
|
||||
cancel-in-progress: false
|
||||
|
||||
# Default to bash
|
||||
defaults:
|
||||
run:
|
||||
shell: bash
|
||||
|
||||
jobs:
|
||||
# Build job
|
||||
build:
|
||||
runs-on: ubuntu-latest
|
||||
env:
|
||||
HUGO_VERSION: 0.124.0
|
||||
steps:
|
||||
- name: Install Hugo CLI
|
||||
run: |
|
||||
wget -O ${{ runner.temp }}/hugo.deb https://github.com/gohugoio/hugo/releases/download/v${HUGO_VERSION}/hugo_extended_${HUGO_VERSION}_linux-amd64.deb \
|
||||
&& sudo dpkg -i ${{ runner.temp }}/hugo.deb
|
||||
- name: Install Dart Sass
|
||||
run: sudo snap install dart-sass
|
||||
- name: Checkout
|
||||
uses: actions/checkout@v4
|
||||
with:
|
||||
submodules: recursive
|
||||
fetch-depth: 0
|
||||
- name: Setup Pages
|
||||
id: pages
|
||||
uses: actions/configure-pages@v4
|
||||
- name: Install Node.js dependencies
|
||||
run: "[[ -f package-lock.json || -f npm-shrinkwrap.json ]] && npm ci || true"
|
||||
- name: Build with Hugo
|
||||
env:
|
||||
# For maximum backward compatibility with Hugo modules
|
||||
HUGO_ENVIRONMENT: production
|
||||
HUGO_ENV: production
|
||||
run: |
|
||||
hugo \
|
||||
--gc \
|
||||
--minify \
|
||||
--baseURL "${{ steps.pages.outputs.base_url }}/"
|
||||
- name: Upload artifact
|
||||
uses: actions/upload-pages-artifact@v3
|
||||
with:
|
||||
path: ./public
|
||||
|
||||
# Deployment job
|
||||
deploy:
|
||||
environment:
|
||||
name: github-pages
|
||||
url: ${{ steps.deployment.outputs.page_url }}
|
||||
runs-on: ubuntu-latest
|
||||
needs: build
|
||||
steps:
|
||||
- name: Deploy to GitHub Pages
|
||||
id: deployment
|
||||
uses: actions/deploy-pages@v4
|
||||
@@ -79,7 +79,7 @@
|
||||
* Global font family
|
||||
*/
|
||||
:root {
|
||||
--code-font-family: 'Jetbrains Mono', Menlo, Monaco, Consolas, 'Courier New',
|
||||
--code-font-family: 'Maple Font Mono', Menlo, Monaco, Consolas, 'Courier New',
|
||||
var(--zh-font-family), monospace;
|
||||
}
|
||||
|
||||
|
||||
21
config.yaml
21
config.yaml
@@ -1,25 +1,22 @@
|
||||
baseurl: https://www.taurusxin.com
|
||||
languageCode: zh-cn
|
||||
theme: hugo-theme-stack
|
||||
pagination:
|
||||
pagerSize: 10
|
||||
title: TaurusXin 的独立博客
|
||||
|
||||
# Change it to your Disqus shortname before using
|
||||
disqusShortname: taurusxin
|
||||
|
||||
# GA Tracking ID
|
||||
googleAnalytics:
|
||||
|
||||
# Theme i18n support
|
||||
# Available values: en, fr, id, ja, ko, pt-br, zh-cn, zh-tw, es, de, nl, it, th, el, uk
|
||||
DefaultContentLanguage: zh-cn
|
||||
|
||||
# Set hasCJKLanguage to true if DefaultContentLanguage is in [zh-cn ja ko]
|
||||
# This will make .Summary and .WordCount behave correctly for CJK languages.
|
||||
hasCJKLanguage: false
|
||||
services:
|
||||
# Change it to your Disqus shortname before using
|
||||
disqus:
|
||||
shortname: "taurusxin"
|
||||
# GA Tracking ID
|
||||
googleAnalytics:
|
||||
id: "G-KN4M42XST7"
|
||||
|
||||
enableRobotsTXT: true
|
||||
pagination:
|
||||
pagerSize: 10
|
||||
|
||||
permalinks:
|
||||
post: /:slug/
|
||||
|
||||
@@ -12,8 +12,23 @@ edit: false
|
||||
comment: true
|
||||
---
|
||||
|
||||
### 申请要求
|
||||
|
||||
感谢添加我为友链,作为互联网的一个独立的小角落,也希望您的网站能够满足以下几点简单的要求
|
||||
|
||||
- 有超过 5 篇独立的原创文章
|
||||
- 网站使用独立的付费域名,使用标准 HTTPS 端口(443),开启 SSL 证书
|
||||
- 不接受包括但不限于以下内容的友链申请
|
||||
- 带有推广性质(云服务、广告等)的博客
|
||||
- 论坛
|
||||
- 资源分享
|
||||
|
||||
我将每个季度审查一次所有已添加友链的网站,若发现网站无法访问或不符合上述要求,将移除该友链
|
||||
|
||||
### 友链申请格式
|
||||
|
||||
请按以下格式在评论区留言~
|
||||
|
||||
> 网站名称:TaurusXin 的独立博客
|
||||
>
|
||||
> 网站链接:<https://www.taurusxin.com>
|
||||
|
||||
90
content/post/088.cerebras/index.md
Normal file
90
content/post/088.cerebras/index.md
Normal file
@@ -0,0 +1,90 @@
|
||||
---
|
||||
title: "世界上最快的 AI 模型提供商 Cerebras"
|
||||
categories: [ "AIGC" ]
|
||||
tags: [ "ai", "llm" ]
|
||||
draft: false
|
||||
slug: "cerebras"
|
||||
date: "2025-11-10T13:51:00+0800"
|
||||
---
|
||||
|
||||
## 前言
|
||||
|
||||
好久没更新文章了,关于 AIGC 相关的文章(部署、使用、MCP……),网络上可有太多现有的文章,我就不在这里过多赘述了。
|
||||
|
||||
但是最近我注意到了一个新的 AI 模型提供商,让我瞬间眼前一亮。
|
||||
|
||||
介绍给各位使用 —— Cerebras
|
||||
|
||||
## 模型对比
|
||||
|
||||
|
||||
|
||||
在测试 Cerebras 前,我们先来看看其他接口模型的 Token 生成速度,我日常会使用到的提供商有:硅基流动、火山引擎,以及最近开始使用的阿里云百炼。
|
||||
|
||||
测试环境为:
|
||||
|
||||
- Cherry Studio
|
||||
|
||||
模型有:
|
||||
|
||||
- 硅基流动 - DeepSeek V3.1
|
||||
- 火山引擎方舟 - DeepSeek V3.1 Terminus
|
||||
- 阿里云百炼国际版 - Qwen3 Max
|
||||
|
||||
使用的 prompt 如下,所有模型配置均为默认,没有系统提示词
|
||||
|
||||
```text
|
||||
请你帮我编写一个 React 应用程序,使用 TypeScript 语言,且不使用任何其它库,程序的内容如下
|
||||
|
||||
1. 一个 Todo List App,具备基本的功能(添加、删除、标记完成、取消标记等)
|
||||
2. 支持为未来设定待办事项
|
||||
3. 支持保存数据到本地,每次打开或刷新浏览器时都能保持数据
|
||||
```
|
||||
|
||||
结果如下
|
||||
|
||||
| 提供商 | 模型 | 首字延迟(ms) | 输入 Token 数 | 输出 Token 数 | 输出耗时(s) | 输出速度(Token/s) |
|
||||
| ---------------- | --------------------- | -------------- | ----------- | ------------- | -------- | ------------------- |
|
||||
| 硅基流动 | DeepSeek V3.1 | 727 | 83 | 2306 | 121.3 | 19.01 |
|
||||
| 火山引擎方舟 | DeepSeek V3.1 Terminus | 712 | 81 | 3331 | 95.1 | 35.03 |
|
||||
| 阿里云百炼国际版 | Qwen3 Max | 1487 | 88 | 2877 | 82.2 | 35 |
|
||||
|
||||
> 请注意:该测试仅评估模型输出速率,不评估模型输出内容质量
|
||||
|
||||
基本都是在 50 T/s 以下,当然这仅仅是一个对我常用的模型接口的随机测试,不能代表所有模型设施的性能。
|
||||
|
||||
## Cerebras
|
||||
|
||||
打开 cerebras 的官网,就能看到大大的一行 “世界最快 AI 基础设施” 的字样,可见他们对自家 API 的对话生成速度非常自信
|
||||
|
||||

|
||||
|
||||
文档中介绍的速度均可达到 2-3 kT/s,非常恐怖,不过目前支持的模型不多,例如 `qwen3-code-480b`
|
||||
|
||||

|
||||
|
||||
最后我们就来实际测试一下 cerebras,注册好账号后,生成一个 key,导入到 Cherry Studio,模型使用最快的 `OpenAI GPT OSS`,然后要做的,就是点击发送
|
||||
|
||||
| 提供商 | 模型 | 首字延迟(ms) | 输入 Token 数 | 输出 Token 数 | 输出耗时(s) | 输出速度(Token/s) |
|
||||
| -------- | ------- | -------------- | ----------- | ------------- | -------- | ------------------- |
|
||||
| Cerebras | GPT OSS | 656 | 183 | 3265 | 1.48 | 2197.17 |
|
||||
|
||||
速度达到恐怖的 2200T/s,整个生成过程在 1.5 秒内完成
|
||||
|
||||
来看看实际效果,这里我录了一个视频
|
||||
|
||||
{{< video "https://cdn.taurusxin.com/hugo/2025/11/10/cerebras-gptoss.mov" >}}
|
||||
|
||||
按下发送按钮后的不到 2 秒,整个组件的完整代码都生成完了,一气呵成。
|
||||
|
||||
如果把它用在代码编辑器辅助编程,效果会非常爽,具体方案是 `VSCode + Cline 插件`,只不过一定要注意 Token 消耗,速度快了,Token 消耗也会快很多,一不小心很容易超出免费额度。
|
||||
|
||||
## 总结
|
||||
|
||||
Cerebras 目前知道的人并不多,价格表在 <https://www.cerebras.ai/pricing>
|
||||
|
||||

|
||||
|
||||
目前还推出了官方的 Code 服务 `Cerebras Code`,每天可用 2400 万 Token,最高 131k 的上下文支持,价格相较于其他代码生成服务比较贵,$50 每月,不过对于这么快的生成速度,也能接受。
|
||||
|
||||
至于免费版,我没有在文档中找到免费额度是每天或者每月多少,有找到的小伙伴可以说一下,免费版和付费版的输出速度是一样的,这点好评。
|
||||
@@ -16,25 +16,15 @@
|
||||
|
||||
<style>
|
||||
@font-face{
|
||||
font-family: 'JetBrains Mono';
|
||||
src: url('https://cdn.taurusxin.com/hugo/assets/fonts/JetBrainsMono/JetBrainsMono-Regular.woff2') format('woff2'),
|
||||
url('https://cdn.taurusxin.com/hugo/assets/fonts/JetBrainsMono/JetBrainsMono-Regular.woff') format('woff'),
|
||||
url('https://cdn.taurusxin.com/hugo/assets/fonts/JetBrainsMono/JetBrainsMono-Regular.ttf') format('truetype');
|
||||
font-family: 'Maple Font Mono';
|
||||
src: url('https://cdn.taurusxin.com/hugo/assets/fonts/MapleFontMono/MapleMono-Regular.woff2') format('woff2'),
|
||||
url('https://cdn.taurusxin.com/hugo/assets/fonts/MapleFontMono/MapleMono-Regular.woff') format('woff'),
|
||||
url('https://cdn.taurusxin.com/hugo/assets/fonts/MapleFontMono/MapleMono-Regular.ttf') format('truetype');
|
||||
font-weight: 400;
|
||||
font-style: normal;
|
||||
}
|
||||
</style>
|
||||
|
||||
<!-- Google tag (gtag.js) -->
|
||||
<script async src="https://www.googletagmanager.com/gtag/js?id=G-KN4M42XST7"></script>
|
||||
<script>
|
||||
window.dataLayer = window.dataLayer || [];
|
||||
function gtag(){dataLayer.push(arguments);}
|
||||
gtag('js', new Date());
|
||||
|
||||
gtag('config', 'G-KN4M42XST7');
|
||||
</script>
|
||||
|
||||
<!-- Baidu Analytics -->
|
||||
<script>
|
||||
var _hmt = _hmt || [];
|
||||
|
||||
Submodule themes/hugo-theme-stack updated: 9e6b7b22a9...73ccacec4d
Reference in New Issue
Block a user