初次提交

This commit is contained in:
Kynix Chen 2024-08-16 18:34:05 +08:00
commit b63f0c07b8
18 changed files with 44718 additions and 0 deletions

8
.idea/.gitignore vendored Normal file
View File

@ -0,0 +1,8 @@
# Default ignored files
/shelf/
/workspace.xml
# Editor-based HTTP Client requests
/httpRequests/
# Datasource local storage ignored files
/dataSources/
/dataSources.local.xml

9
.idea/DewvineAPI.iml Normal file
View File

@ -0,0 +1,9 @@
<?xml version="1.0" encoding="UTF-8"?>
<module type="WEB_MODULE" version="4">
<component name="Go" enabled="true" />
<component name="NewModuleRootManager">
<content url="file://$MODULE_DIR$" />
<orderEntry type="inheritedJdk" />
<orderEntry type="sourceFolder" forTests="false" />
</component>
</module>

View File

@ -0,0 +1,7 @@
{
"enableAutoRestart" : false,
"scanSuffix" : "java,rs,kt,go,py",
"scanPath" : "",
"fileSuffix" : "java,rs,kt,go,py,md,zig",
"excludePath" : ".idea,.gradle,.git,node_modules,build"
}

8
.idea/modules.xml Normal file
View File

@ -0,0 +1,8 @@
<?xml version="1.0" encoding="UTF-8"?>
<project version="4">
<component name="ProjectModuleManager">
<modules>
<module fileurl="file://$PROJECT_DIR$/.idea/DewvineAPI.iml" filepath="$PROJECT_DIR$/.idea/DewvineAPI.iml" />
</modules>
</component>
</project>

17
Dockerfile Normal file
View File

@ -0,0 +1,17 @@
# 使用Golang的基础镜像
FROM golang:latest
# 设置工作目录
WORKDIR /app
# 将本地的代码复制到容器中
COPY . .
# 构建应用程序
RUN go build -o main .
# 暴露容器的端口
EXPOSE 7080
# 运行应用程序
CMD ["./main"]

57
README.md Normal file
View File

@ -0,0 +1,57 @@
# 蔓露 Dewvine
承襲自<a href="https://developer.hitokoto.cn/">一言</a>的中文精確校正語料庫。
## 介紹
中文名字“**蔓露**”取自《詩經·鄭風·野有蔓草》,原文是“野有蔓草,零露漙兮。”
本文描寫了在一個露珠未乾的清晨,與一位美麗的女子的浪漫邂逅。希望專案中經過校閱的每一個句子,都能夠像文中一樣,與你的心靈產生共鳴,與你來一場美妙的遇見。
本專案承襲自<a href="https://developer.hitokoto.cn/">一言</a>,並繼承前輩<a href="https://github.com/elegant-tw">言雅</a>之精神。由於一言僅支援簡體中文的缺陷,本專案在對一言的原始資料進行了繁體中文轉換,並在轉換後進行人工校閱,修正了某些錯誤的格式。
一言共提供動畫、漫畫、遊戲、文學、原創、來自網路、其他、影視、詩詞、網易雲、哲學、抖機靈等十三種類型的句子,本專案根據個人喜好,僅保留其中**文學、來自網路、詩詞和哲學**四類,並對其中某些露骨和低俗的句子進行人工刪改。
除提供繁體中文服務,蔓露也保留了校閱後的簡體中文版本。
## 使用
### 使用語料庫
語料庫採用 json 格式儲存,位於 `data` 目錄下,可直接下載或 Clone 使用。
### 使用 API
#### 手動部署
本 API 使用 `go` 寫成,因此請確保你的環境中有配置好 `go` 環境。
1. 下載專案
```bash
git clone https://merak.axiomatrix.org/Axiomatrix_Org/Dewvine.git
cd Dewvine
```
2. 補齊依賴的模組
```bash
go mod tidy
```
3. 執行專案
```bash
go run main.go
```
後台執行:
```bash
nohup go run main.go &
```
#### Docker 部署
本專案已經將 docker image 傳送至 Docker Hub你可以直接使用以下指令部署
```bash
docker run -d -p 7080:7080 kynixtw/dewvine:latest
```
或者使用 `docker-compose` 部署。本專案提供一個 `docker-compose.yml` 模板,你可以直接使用以下指令部署:
```bash
docker-compose up -d
```

4306
data/zh-CN/internet.json Normal file

File diff suppressed because it is too large Load Diff

10706
data/zh-CN/literature.json Normal file

File diff suppressed because it is too large Load Diff

1602
data/zh-CN/philosophy.json Normal file

File diff suppressed because it is too large Load Diff

5530
data/zh-CN/poem.json Normal file

File diff suppressed because it is too large Load Diff

4306
data/zh-TW/internet.json Normal file

File diff suppressed because it is too large Load Diff

10706
data/zh-TW/literature.json Normal file

File diff suppressed because it is too large Load Diff

1602
data/zh-TW/philosophy.json Normal file

File diff suppressed because it is too large Load Diff

5530
data/zh-TW/poem.json Normal file

File diff suppressed because it is too large Load Diff

8
docker-compose.yml Normal file
View File

@ -0,0 +1,8 @@
version: '3.8'
services:
dewvine:
container_name: dewvine
image: kynixtw/dewvine:2024
ports:
- "7080:7080"

39
go.mod Normal file
View File

@ -0,0 +1,39 @@
module DewvineAPI
go 1.22
require github.com/gin-gonic/gin v1.10.0
require (
github.com/bytedance/sonic v1.11.9 // indirect
github.com/bytedance/sonic/loader v0.1.1 // indirect
github.com/cloudwego/base64x v0.1.4 // indirect
github.com/cloudwego/iasm v0.2.0 // indirect
github.com/gabriel-vasile/mimetype v1.4.4 // indirect
github.com/gin-contrib/sse v0.1.0 // indirect
github.com/go-playground/locales v0.14.1 // indirect
github.com/go-playground/universal-translator v0.18.1 // indirect
github.com/go-playground/validator/v10 v10.22.0 // indirect
github.com/goccy/go-json v0.10.3 // indirect
github.com/google/go-cmp v0.6.0 // indirect
github.com/json-iterator/go v1.1.12 // indirect
github.com/klauspost/cpuid/v2 v2.2.8 // indirect
github.com/kr/pretty v0.3.1 // indirect
github.com/leodido/go-urn v1.4.0 // indirect
github.com/mattn/go-isatty v0.0.20 // indirect
github.com/modern-go/concurrent v0.0.0-20180306012644-bacd9c7ef1dd // indirect
github.com/modern-go/reflect2 v1.0.2 // indirect
github.com/pelletier/go-toml/v2 v2.2.2 // indirect
github.com/rogpeppe/go-internal v1.11.0 // indirect
github.com/twitchyliquid64/golang-asm v0.15.1 // indirect
github.com/ugorji/go/codec v1.2.12 // indirect
golang.org/x/arch v0.8.0 // indirect
golang.org/x/crypto v0.25.0 // indirect
golang.org/x/net v0.27.0 // indirect
golang.org/x/sys v0.22.0 // indirect
golang.org/x/text v0.16.0 // indirect
google.golang.org/protobuf v1.34.2 // indirect
gopkg.in/check.v1 v1.0.0-20201130134442-10cb98267c6c // indirect
gopkg.in/yaml.v3 v3.0.1 // indirect
merak.axiomatrix.org/Axiomatrix_Org/optimized_go_tools v0.0.0-20240806071711-ae889abd1da4 // indirect
)

102
go.sum Normal file
View File

@ -0,0 +1,102 @@
github.com/bytedance/sonic v1.11.9 h1:LFHENlIY/SLzDWverzdOvgMztTxcfcF+cqNsz9pK5zg=
github.com/bytedance/sonic v1.11.9/go.mod h1:LysEHSvpvDySVdC2f87zGWf6CIKJcAvqab1ZaiQtds4=
github.com/bytedance/sonic/loader v0.1.1 h1:c+e5Pt1k/cy5wMveRDyk2X4B9hF4g7an8N3zCYjJFNM=
github.com/bytedance/sonic/loader v0.1.1/go.mod h1:ncP89zfokxS5LZrJxl5z0UJcsk4M4yY2JpfqGeCtNLU=
github.com/cloudwego/base64x v0.1.4 h1:jwCgWpFanWmN8xoIUHa2rtzmkd5J2plF/dnLS6Xd/0Y=
github.com/cloudwego/base64x v0.1.4/go.mod h1:0zlkT4Wn5C6NdauXdJRhSKRlJvmclQ1hhJgA0rcu/8w=
github.com/cloudwego/iasm v0.2.0 h1:1KNIy1I1H9hNNFEEH3DVnI4UujN+1zjpuk6gwHLTssg=
github.com/cloudwego/iasm v0.2.0/go.mod h1:8rXZaNYT2n95jn+zTI1sDr+IgcD2GVs0nlbbQPiEFhY=
github.com/creack/pty v1.1.9/go.mod h1:oKZEueFk5CKHvIhNR5MUki03XCEU+Q6VDXinZuGJ33E=
github.com/davecgh/go-spew v1.1.0/go.mod h1:J7Y8YcW2NihsgmVo/mv3lAwl/skON4iLHjSsI+c5H38=
github.com/davecgh/go-spew v1.1.1 h1:vj9j/u1bqnvCEfJOwUhtlOARqs3+rkHYY13jYWTU97c=
github.com/davecgh/go-spew v1.1.1/go.mod h1:J7Y8YcW2NihsgmVo/mv3lAwl/skON4iLHjSsI+c5H38=
github.com/gabriel-vasile/mimetype v1.4.4 h1:QjV6pZ7/XZ7ryI2KuyeEDE8wnh7fHP9YnQy+R0LnH8I=
github.com/gabriel-vasile/mimetype v1.4.4/go.mod h1:JwLei5XPtWdGiMFB5Pjle1oEeoSeEuJfJE+TtfvdB/s=
github.com/gin-contrib/sse v0.1.0 h1:Y/yl/+YNO8GZSjAhjMsSuLt29uWRFHdHYUb5lYOV9qE=
github.com/gin-contrib/sse v0.1.0/go.mod h1:RHrZQHXnP2xjPF+u1gW/2HnVO7nvIa9PG3Gm+fLHvGI=
github.com/gin-gonic/gin v1.10.0 h1:nTuyha1TYqgedzytsKYqna+DfLos46nTv2ygFy86HFU=
github.com/gin-gonic/gin v1.10.0/go.mod h1:4PMNQiOhvDRa013RKVbsiNwoyezlm2rm0uX/T7kzp5Y=
github.com/go-playground/assert/v2 v2.2.0 h1:JvknZsQTYeFEAhQwI4qEt9cyV5ONwRHC+lYKSsYSR8s=
github.com/go-playground/assert/v2 v2.2.0/go.mod h1:VDjEfimB/XKnb+ZQfWdccd7VUvScMdVu0Titje2rxJ4=
github.com/go-playground/locales v0.14.1 h1:EWaQ/wswjilfKLTECiXz7Rh+3BjFhfDFKv/oXslEjJA=
github.com/go-playground/locales v0.14.1/go.mod h1:hxrqLVvrK65+Rwrd5Fc6F2O76J/NuW9t0sjnWqG1slY=
github.com/go-playground/universal-translator v0.18.1 h1:Bcnm0ZwsGyWbCzImXv+pAJnYK9S473LQFuzCbDbfSFY=
github.com/go-playground/universal-translator v0.18.1/go.mod h1:xekY+UJKNuX9WP91TpwSH2VMlDf28Uj24BCp08ZFTUY=
github.com/go-playground/validator/v10 v10.22.0 h1:k6HsTZ0sTnROkhS//R0O+55JgM8C4Bx7ia+JlgcnOao=
github.com/go-playground/validator/v10 v10.22.0/go.mod h1:dbuPbCMFw/DrkbEynArYaCwl3amGuJotoKCe95atGMM=
github.com/goccy/go-json v0.10.3 h1:KZ5WoDbxAIgm2HNbYckL0se1fHD6rz5j4ywS6ebzDqA=
github.com/goccy/go-json v0.10.3/go.mod h1:oq7eo15ShAhp70Anwd5lgX2pLfOS3QCiwU/PULtXL6M=
github.com/google/go-cmp v0.6.0 h1:ofyhxvXcZhMsU5ulbFiLKl/XBFqE1GSq7atu8tAmTRI=
github.com/google/go-cmp v0.6.0/go.mod h1:17dUlkBOakJ0+DkrSSNjCkIjxS6bF9zb3elmeNGIjoY=
github.com/google/gofuzz v1.0.0/go.mod h1:dBl0BpW6vV/+mYPU4Po3pmUjxk6FQPldtuIdl/M65Eg=
github.com/json-iterator/go v1.1.12 h1:PV8peI4a0ysnczrg+LtxykD8LfKY9ML6u2jnxaEnrnM=
github.com/json-iterator/go v1.1.12/go.mod h1:e30LSqwooZae/UwlEbR2852Gd8hjQvJoHmT4TnhNGBo=
github.com/klauspost/cpuid/v2 v2.0.9/go.mod h1:FInQzS24/EEf25PyTYn52gqo7WaD8xa0213Md/qVLRg=
github.com/klauspost/cpuid/v2 v2.2.8 h1:+StwCXwm9PdpiEkPyzBXIy+M9KUb4ODm0Zarf1kS5BM=
github.com/klauspost/cpuid/v2 v2.2.8/go.mod h1:Lcz8mBdAVJIBVzewtcLocK12l3Y+JytZYpaMropDUws=
github.com/knz/go-libedit v1.10.1/go.mod h1:MZTVkCWyz0oBc7JOWP3wNAzd002ZbM/5hgShxwh4x8M=
github.com/kr/pretty v0.2.1/go.mod h1:ipq/a2n7PKx3OHsz4KJII5eveXtPO4qwEXGdVfWzfnI=
github.com/kr/pretty v0.3.1 h1:flRD4NNwYAUpkphVc1HcthR4KEIFJ65n8Mw5qdRn3LE=
github.com/kr/pretty v0.3.1/go.mod h1:hoEshYVHaxMs3cyo3Yncou5ZscifuDolrwPKZanG3xk=
github.com/kr/pty v1.1.1/go.mod h1:pFQYn66WHrOpPYNljwOMqo10TkYh1fy3cYio2l3bCsQ=
github.com/kr/text v0.1.0/go.mod h1:4Jbv+DJW3UT/LiOwJeYQe1efqtUx/iVham/4vfdArNI=
github.com/kr/text v0.2.0 h1:5Nx0Ya0ZqY2ygV366QzturHI13Jq95ApcVaJBhpS+AY=
github.com/kr/text v0.2.0/go.mod h1:eLer722TekiGuMkidMxC/pM04lWEeraHUUmBw8l2grE=
github.com/leodido/go-urn v1.4.0 h1:WT9HwE9SGECu3lg4d/dIA+jxlljEa1/ffXKmRjqdmIQ=
github.com/leodido/go-urn v1.4.0/go.mod h1:bvxc+MVxLKB4z00jd1z+Dvzr47oO32F/QSNjSBOlFxI=
github.com/mattn/go-isatty v0.0.20 h1:xfD0iDuEKnDkl03q4limB+vH+GxLEtL/jb4xVJSWWEY=
github.com/mattn/go-isatty v0.0.20/go.mod h1:W+V8PltTTMOvKvAeJH7IuucS94S2C6jfK/D7dTCTo3Y=
github.com/modern-go/concurrent v0.0.0-20180228061459-e0a39a4cb421/go.mod h1:6dJC0mAP4ikYIbvyc7fijjWJddQyLn8Ig3JB5CqoB9Q=
github.com/modern-go/concurrent v0.0.0-20180306012644-bacd9c7ef1dd h1:TRLaZ9cD/w8PVh93nsPXa1VrQ6jlwL5oN8l14QlcNfg=
github.com/modern-go/concurrent v0.0.0-20180306012644-bacd9c7ef1dd/go.mod h1:6dJC0mAP4ikYIbvyc7fijjWJddQyLn8Ig3JB5CqoB9Q=
github.com/modern-go/reflect2 v1.0.2 h1:xBagoLtFs94CBntxluKeaWgTMpvLxC4ur3nMaC9Gz0M=
github.com/modern-go/reflect2 v1.0.2/go.mod h1:yWuevngMOJpCy52FWWMvUC8ws7m/LJsjYzDa0/r8luk=
github.com/pelletier/go-toml/v2 v2.2.2 h1:aYUidT7k73Pcl9nb2gScu7NSrKCSHIDE89b3+6Wq+LM=
github.com/pelletier/go-toml/v2 v2.2.2/go.mod h1:1t835xjRzz80PqgE6HHgN2JOsmgYu/h4qDAS4n929Rs=
github.com/pkg/diff v0.0.0-20210226163009-20ebb0f2a09e/go.mod h1:pJLUxLENpZxwdsKMEsNbx1VGcRFpLqf3715MtcvvzbA=
github.com/pmezard/go-difflib v1.0.0 h1:4DBwDE0NGyQoBHbLQYPwSUPoCMWR5BEzIk/f1lZbAQM=
github.com/pmezard/go-difflib v1.0.0/go.mod h1:iKH77koFhYxTK1pcRnkKkqfTogsbg7gZNVY4sRDYZ/4=
github.com/rogpeppe/go-internal v1.9.0/go.mod h1:WtVeX8xhTBvf0smdhujwtBcq4Qrzq/fJaraNFVN+nFs=
github.com/rogpeppe/go-internal v1.11.0 h1:cWPaGQEPrBb5/AsnsZesgZZ9yb1OQ+GOISoDNXVBh4M=
github.com/rogpeppe/go-internal v1.11.0/go.mod h1:ddIwULY96R17DhadqLgMfk9H9tvdUzkipdSkR5nkCZA=
github.com/stretchr/objx v0.1.0/go.mod h1:HFkY916IF+rwdDfMAkV7OtwuqBVzrE8GR6GFx+wExME=
github.com/stretchr/objx v0.4.0/go.mod h1:YvHI0jy2hoMjB+UWwv71VJQ9isScKT/TqJzVSSt89Yw=
github.com/stretchr/objx v0.5.0/go.mod h1:Yh+to48EsGEfYuaHDzXPcE3xhTkx73EhmCGUpEOglKo=
github.com/stretchr/objx v0.5.2/go.mod h1:FRsXN1f5AsAjCGJKqEizvkpNtU+EGNCLh3NxZ/8L+MA=
github.com/stretchr/testify v1.3.0/go.mod h1:M5WIy9Dh21IEIfnGCwXGc5bZfKNJtfHm1UVUgZn+9EI=
github.com/stretchr/testify v1.7.0/go.mod h1:6Fq8oRcR53rry900zMqJjRRixrwX3KX962/h/Wwjteg=
github.com/stretchr/testify v1.7.1/go.mod h1:6Fq8oRcR53rry900zMqJjRRixrwX3KX962/h/Wwjteg=
github.com/stretchr/testify v1.8.0/go.mod h1:yNjHg4UonilssWZ8iaSj1OCr/vHnekPRkoO+kdMU+MU=
github.com/stretchr/testify v1.8.1/go.mod h1:w2LPCIKwWwSfY2zedu0+kehJoqGctiVI29o6fzry7u4=
github.com/stretchr/testify v1.8.4/go.mod h1:sz/lmYIOXD/1dqDmKjjqLyZ2RngseejIcXlSw2iwfAo=
github.com/stretchr/testify v1.9.0 h1:HtqpIVDClZ4nwg75+f6Lvsy/wHu+3BoSGCbBAcpTsTg=
github.com/stretchr/testify v1.9.0/go.mod h1:r2ic/lqez/lEtzL7wO/rwa5dbSLXVDPFyf8C91i36aY=
github.com/twitchyliquid64/golang-asm v0.15.1 h1:SU5vSMR7hnwNxj24w34ZyCi/FmDZTkS4MhqMhdFk5YI=
github.com/twitchyliquid64/golang-asm v0.15.1/go.mod h1:a1lVb/DtPvCB8fslRZhAngC2+aY1QWCk3Cedj/Gdt08=
github.com/ugorji/go/codec v1.2.12 h1:9LC83zGrHhuUA9l16C9AHXAqEV/2wBQ4nkvumAE65EE=
github.com/ugorji/go/codec v1.2.12/go.mod h1:UNopzCgEMSXjBc6AOMqYvWC1ktqTAfzJZUZgYf6w6lg=
golang.org/x/arch v0.0.0-20210923205945-b76863e36670/go.mod h1:5om86z9Hs0C8fWVUuoMHwpExlXzs5Tkyp9hOrfG7pp8=
golang.org/x/arch v0.8.0 h1:3wRIsP3pM4yUptoR96otTUOXI367OS0+c9eeRi9doIc=
golang.org/x/arch v0.8.0/go.mod h1:FEVrYAQjsQXMVJ1nsMoVVXPZg6p2JE2mx8psSWTDQys=
golang.org/x/crypto v0.25.0 h1:ypSNr+bnYL2YhwoMt2zPxHFmbAN1KZs/njMG3hxUp30=
golang.org/x/crypto v0.25.0/go.mod h1:T+wALwcMOSE0kXgUAnPAHqTLW+XHgcELELW8VaDgm/M=
golang.org/x/net v0.27.0 h1:5K3Njcw06/l2y9vpGCSdcxWOYHOUk3dVNGDXN+FvAys=
golang.org/x/net v0.27.0/go.mod h1:dDi0PyhWNoiUOrAS8uXv/vnScO4wnHQO4mj9fn/RytE=
golang.org/x/sys v0.5.0/go.mod h1:oPkhp1MJrh7nUepCBck5+mAzfO9JrbApNNgaTdGDITg=
golang.org/x/sys v0.6.0/go.mod h1:oPkhp1MJrh7nUepCBck5+mAzfO9JrbApNNgaTdGDITg=
golang.org/x/sys v0.22.0 h1:RI27ohtqKCnwULzJLqkv897zojh5/DwS/ENaMzUOaWI=
golang.org/x/sys v0.22.0/go.mod h1:/VUhepiaJMQUp4+oa/7Zr1D23ma6VTLIYjOOTFZPUcA=
golang.org/x/text v0.16.0 h1:a94ExnEXNtEwYLGJSIUxnWoxoRz/ZcCsV63ROupILh4=
golang.org/x/text v0.16.0/go.mod h1:GhwF1Be+LQoKShO3cGOHzqOgRrGaYc9AvblQOmPVHnI=
google.golang.org/protobuf v1.34.2 h1:6xV6lTsCfpGD21XK49h7MhtcApnLqkfYgPcdHftf6hg=
google.golang.org/protobuf v1.34.2/go.mod h1:qYOHts0dSfpeUzUFpOMr/WGzszTmLH+DiWniOlNbLDw=
gopkg.in/check.v1 v0.0.0-20161208181325-20d25e280405/go.mod h1:Co6ibVJAznAaIkqp8huTwlJQCZ016jof/cbN4VW5Yz0=
gopkg.in/check.v1 v1.0.0-20201130134442-10cb98267c6c h1:Hei/4ADfdWqJk1ZMxUNpqntNwaWcugrBjAiHlqqRiVk=
gopkg.in/check.v1 v1.0.0-20201130134442-10cb98267c6c/go.mod h1:JHkPIbrfpd72SG/EVd6muEfDQjcINNoR0C8j2r3qZ4Q=
gopkg.in/yaml.v3 v3.0.0-20200313102051-9f266ea9e77c/go.mod h1:K4uyk7z7BCEPqu6E+C64Yfv1cQ7kz7rIZviUmN+EgEM=
gopkg.in/yaml.v3 v3.0.1 h1:fxVm/GzAzEWqLHuvctI91KS9hhNmmWOoWu0XTYJS7CA=
gopkg.in/yaml.v3 v3.0.1/go.mod h1:K4uyk7z7BCEPqu6E+C64Yfv1cQ7kz7rIZviUmN+EgEM=
merak.axiomatrix.org/Axiomatrix_Org/optimized_go_tools v0.0.0-20240806071711-ae889abd1da4 h1:lS9uvcRVFdKZbwBQDpB3td4tmkx8azO3iMRMEfhhKm8=
merak.axiomatrix.org/Axiomatrix_Org/optimized_go_tools v0.0.0-20240806071711-ae889abd1da4/go.mod h1:cvBj2+/c+dVVR2KiUQfuMtXGU8sYEQG1TxOmp5T8os8=
nullprogram.com/x/optparse v1.0.0/go.mod h1:KdyPE+Igbe0jQUrVfMqDMeJQIJZEuyV7pjYmp6pbG50=
rsc.io/pdf v0.1.1/go.mod h1:n8OzWcQ6Sp37PL01nO98y4iUCRdTGarVfzxY20ICaU4=

175
main.go Normal file
View File

@ -0,0 +1,175 @@
package main
import (
"encoding/json"
"github.com/gin-gonic/gin"
"math/rand"
"merak.axiomatrix.org/Axiomatrix_Org/optimized_go_tools/am_cors"
"merak.axiomatrix.org/Axiomatrix_Org/optimized_go_tools/am_ratelimit"
"os"
"path/filepath"
"strconv"
"strings"
"time"
)
type Data struct {
UUID string `json:"uuid"`
Sentence string `json:"sentence"`
Type string `json:"type"`
From string `json:"from"`
CreatedAt uint `json:"created_at"`
Length int `json:"length"`
}
var dataDir = "./data"
var dataTypes = []string{"internet", "literature", "philosophy", "poem"}
var defaultLimitConfig = am_ratelimit.NewRateLimitConfig(5, 1)
func main() {
gin.SetMode(gin.ReleaseMode)
r := gin.Default()
r.Use(am_cors.Cors())
r.GET("/", defaultLimitConfig.RateLimitMiddleware, func(c *gin.Context) {
t := c.Query("type") // 要求的語料類型
lang := c.Query("lang") // 简体中文 / 繁體中文
ls := c.Query("length") // 要求的語料最大長度
var l int
ns := c.Query("number") // 要求的語料數量
var n int
var dataDirNew string
if lang == "zh-CN" {
dataDirNew = filepath.Join(dataDir, "zh-CN")
} else if lang == "zh-TW" {
dataDirNew = filepath.Join(dataDir, "zh-TW")
} else {
if lang == "" {
dataDirNew = filepath.Join(dataDir, "zh-TW")
} else {
c.JSON(400, gin.H{"error": "invalid lang"})
return
}
}
if ls != "" {
atoi, err := strconv.Atoi(ls)
if err != nil {
c.JSON(500, gin.H{"error": err.Error()})
return
}
l = atoi
} else {
l = 100000000
}
if ns != "" {
atoi, err := strconv.Atoi(ns)
if err != nil {
c.JSON(500, gin.H{"error": err.Error()})
return
}
n = atoi
} else {
n = 1
}
var r int // 符合要求的語料庫長度
var contents []Data // 符合要求的語料庫
if t == "" { // 未指定語料類型,則從所有語料中隨機選取
files, err := os.ReadDir(dataDirNew)
if err != nil {
c.JSON(500, gin.H{"error": err.Error()})
return
}
for _, file := range files {
filePath := filepath.Join(dataDirNew, file.Name())
datas, err := GetFile(filePath)
if err != nil {
c.JSON(500, gin.H{"error": err.Error()})
return
}
contents = append(contents, datas...)
}
r = len(contents)
} else {
ts := strings.Split(t, ",")
for _, t := range ts {
if !Contains(dataTypes, t) {
c.JSON(400, gin.H{"error": "invalid type"})
return
}
}
files, err := os.ReadDir(dataDirNew)
if err != nil {
c.JSON(500, gin.H{"error": err.Error()})
return
}
for _, file := range files {
if Contains(ts, strings.TrimSuffix(file.Name(), ".json")) {
filePath := filepath.Join(dataDirNew, file.Name())
datas, err := GetFile(filePath)
if err != nil {
c.JSON(500, gin.H{"error": err.Error()})
return
}
contents = append(contents, datas...)
}
}
r = len(contents)
}
// 隨機產生語料
var results []Data
for i := 0; i < n; i++ {
var result Data
for {
random := rand.New(rand.NewSource(time.Now().UnixNano()))
randN := random.Intn(r)
content := contents[randN]
if content.Length <= l {
result = content
break
}
}
results = append(results, result)
}
c.JSON(200, results)
})
err := r.Run(":7080")
if err != nil {
panic(err)
}
}
func GetFile(filePath string) ([]Data, error) {
content, err := os.ReadFile(filePath)
if err != nil {
return nil, err
}
var datas []Data
err = json.Unmarshal(content, &datas)
if err != nil {
return nil, err
}
return datas, nil
}
func Contains(arr []string, target string) bool {
for _, a := range arr {
if a == target {
return true
}
}
return false
}