commit 40e207bdb2ad5d7e165d245208f97bcd85ebbcfa Author: Anton Vakhrushev Date: Fri Aug 8 11:13:35 2025 +0300 Init: generated with claude-sonnet-4 diff --git a/.gitignore b/.gitignore new file mode 100644 index 0000000..4e29a03 --- /dev/null +++ b/.gitignore @@ -0,0 +1,51 @@ +# Binaries for programs and plugins +*.exe +*.exe~ +*.dll +*.so +*.dylib + +# Test binary, built with `go test -c` +*.test + +# Output of the go coverage tool, specifically when used with LiteIDE +*.out + +# Dependency directories (remove the comment below to include it) +# vendor/ + +# Go workspace file +go.work + +# Database files +data/transcriber.db +data/transcriber.db-shm +data/transcriber.db-wal + +# Uploaded files +data/files/* +!data/files/.gitkeep + +# IDE files +.vscode/ +.idea/ +*.swp +*.swo +*~ + +# OS generated files +.DS_Store +.DS_Store? +._* +.Spotlight-V100 +.Trashes +ehthumbs.db +Thumbs.db + +# Log files +*.log + +# Environment files +.env +.env.local +.env.*.local diff --git a/README.md b/README.md new file mode 100644 index 0000000..148a476 --- /dev/null +++ b/README.md @@ -0,0 +1,146 @@ +# Transcriber Service + +Сервис для расшифровки аудиозаписей с REST API. + +## Возможности + +- Загрузка аудиофайлов любого формата +- Автоматическая генерация UUID для файлов +- Сохранение файлов на диск +- Отслеживание статуса задач расшифровки +- SQLite база данных для хранения метаданных + +## Технологии + +- **Веб-фреймворк**: gin-gonic/gin +- **SQL Builder**: doug-martin/goqu +- **Миграции БД**: pressly/goose +- **База данных**: SQLite +- **UUID**: google/uuid + +## Установка и запуск + +1. Клонируйте репозиторий +2. Установите зависимости: + ```bash + go mod tidy + ``` +3. Запустите приложение: + ```bash + go run main.go + ``` + +Сервер запустится на порту 8080. + +## API Endpoints + +### POST /api/transcribe + +Загружает аудиофайл и создает задачу на расшифровку. 
+ +**Параметры:** +- `audio` (form-data) - аудиофайл для расшифровки + +**Пример запроса:** +```bash +curl -X POST \ + http://localhost:8080/api/transcribe \ + -F "audio=@/path/to/your/audio.mp3" +``` + +**Ответ:** +```json +{ + "job_id": "550e8400-e29b-41d4-a716-446655440000", + "file_id": "6ba7b810-9dad-11d1-80b4-00c04fd430c8", + "status": "pending" +} +``` + +### GET /api/transcribe/:id + +Получает статус задачи расшифровки по ID. + +**Пример запроса:** +```bash +curl http://localhost:8080/api/transcribe/550e8400-e29b-41d4-a716-446655440000 +``` + +**Ответ:** +```json +{ + "id": "550e8400-e29b-41d4-a716-446655440000", + "status": "pending", + "file_id": "6ba7b810-9dad-11d1-80b4-00c04fd430c8", + "created_at": "2024-01-01T12:00:00Z", + "updated_at": "2024-01-01T12:00:00Z" +} +``` + +### GET /health + +Проверка работоспособности сервиса. + +**Ответ:** +```json +{ + "status": "ok", + "message": "Transcriber service is running" +} +``` + +## Статусы задач + +- `pending` - задача создана, ожидает обработки +- `processing` - задача выполняется +- `completed` - задача завершена успешно +- `failed` - задача завершена с ошибкой + +## Структура проекта + +``` +transcriber/ +├── main.go # Точка входа приложения +├── go.mod # Зависимости Go +├── models/ +│ └── models.go # Модели данных +├── database/ +│ └── database.go # Слой работы с БД +├── handlers/ +│ └── transcribe.go # HTTP обработчики +├── migrations/ +│ ├── 001_create_files_table.sql +│ └── 002_create_transcribe_jobs_table.sql +└── data/ + ├── files/ # Директория для сохранения файлов + └── transcriber.db # SQLite база данных (создается автоматически) +``` + +## База данных + +### Таблица `files` +- `id` (TEXT) - UUID файла +- `type` (TEXT) - MIME-тип файла +- `size` (INTEGER) - размер файла в байтах +- `created_at` (DATETIME) - время создания + +### Таблица `transcribe_jobs` +- `id` (TEXT) - UUID задачи +- `status` (TEXT) - статус задачи +- `file_id` (TEXT) - ссылка на файл +- `created_at` (DATETIME) - время 
создания
+- `updated_at` (DATETIME) - время последнего обновления
+
+## Разработка
+
+Для добавления новых миграций используйте goose:
+
+```bash
+# Создание новой миграции
+goose -dir migrations create migration_name sql
+
+# Применение миграций
+goose -dir migrations sqlite3 data/transcriber.db up
+
+# Откат миграций
+goose -dir migrations sqlite3 data/transcriber.db down
diff --git a/database/database.go b/database/database.go
new file mode 100644
index 0000000..3b41000
--- /dev/null
+++ b/database/database.go
@@ -0,0 +1,130 @@
+package database
+
+import (
+	"database/sql"
+	"fmt"
+	"log"
+
+	"git.vakhrushev.me/av/transcriber/models"
+	"github.com/doug-martin/goqu/v9"
+	_ "github.com/doug-martin/goqu/v9/dialect/sqlite3"
+	_ "github.com/mattn/go-sqlite3"
+	"github.com/pressly/goose/v3"
+)
+
+// DB bundles the raw SQLite connection with a goqu query builder bound to it.
+type DB struct {
+	conn *sql.DB
+	gq   *goqu.Database
+}
+
+// New opens the SQLite database at dbPath and pings it to confirm the
+// connection works. The caller is responsible for calling Close.
+func New(dbPath string) (*DB, error) {
+	conn, err := sql.Open("sqlite3", dbPath)
+	if err != nil {
+		return nil, fmt.Errorf("failed to open database: %w", err)
+	}
+
+	if err := conn.Ping(); err != nil {
+		// Release the handle so a failed ping does not leak it.
+		_ = conn.Close()
+		return nil, fmt.Errorf("failed to ping database: %w", err)
+	}
+
+	return &DB{
+		conn: conn,
+		gq:   goqu.New("sqlite3", conn),
+	}, nil
+}
+
+// RunMigrations applies all pending goose migrations found in migrationsDir.
+func (db *DB) RunMigrations(migrationsDir string) error {
+	if err := goose.SetDialect("sqlite3"); err != nil {
+		return fmt.Errorf("failed to set goose dialect: %w", err)
+	}
+
+	if err := goose.Up(db.conn, migrationsDir); err != nil {
+		return fmt.Errorf("failed to run migrations: %w", err)
+	}
+
+	log.Println("Migrations completed successfully")
+	return nil
+}
+
+// Close closes the underlying database connection.
+func (db *DB) Close() error {
+	return db.conn.Close()
+}
+
+// CreateFile inserts file as a new row of the files table.
+func (db *DB) CreateFile(file *models.File) error {
+	// The statement is not named "sql" so the database/sql package stays visible.
+	stmt, args, err := db.gq.Insert("files").Rows(file).ToSQL()
+	if err != nil {
+		return fmt.Errorf("failed to build query: %w", err)
+	}
+
+	if _, err := db.conn.Exec(stmt, args...); err != nil {
+		return fmt.Errorf("failed to insert file: %w", err)
+	}
+
+	return nil
+}
+
+// CreateTranscribeJob inserts job as a new row of the transcribe_jobs table.
+func (db *DB) CreateTranscribeJob(job *models.TranscribeJob) error {
+	stmt, args, err := db.gq.Insert("transcribe_jobs").Rows(job).ToSQL()
+	if err != nil {
+		return fmt.Errorf("failed to build query: %w", err)
+	}
+
+	if _, err := db.conn.Exec(stmt, args...); err != nil {
+		return fmt.Errorf("failed to insert transcribe job: %w", err)
+	}
+
+	return nil
+}
+
+// GetFileByID returns the files row whose id equals id. The driver error is
+// wrapped with %w, so callers can test for sql.ErrNoRows with errors.Is.
+func (db *DB) GetFileByID(id string) (*models.File, error) {
+	// Columns are listed explicitly so Scan does not depend on the table's
+	// physical column order, as it would with SELECT *.
+	stmt, args, err := db.gq.From("files").
+		Select("id", "type", "size", "created_at").
+		Where(goqu.C("id").Eq(id)).
+		ToSQL()
+	if err != nil {
+		return nil, fmt.Errorf("failed to build query: %w", err)
+	}
+
+	var file models.File
+	err = db.conn.QueryRow(stmt, args...).Scan(&file.ID, &file.Type, &file.Size, &file.CreatedAt)
+	if err != nil {
+		return nil, fmt.Errorf("failed to get file: %w", err)
+	}
+
+	return &file, nil
+}
+
+// GetTranscribeJobByID returns the transcribe_jobs row whose id equals id. The
+// driver error is wrapped with %w, so callers can test for sql.ErrNoRows with
+// errors.Is.
+func (db *DB) GetTranscribeJobByID(id string) (*models.TranscribeJob, error) {
+	stmt, args, err := db.gq.From("transcribe_jobs").
+		Select("id", "status", "file_id", "created_at", "updated_at").
+		Where(goqu.C("id").Eq(id)).
+		ToSQL()
+	if err != nil {
+		return nil, fmt.Errorf("failed to build query: %w", err)
+	}
+
+	var job models.TranscribeJob
+	err = db.conn.QueryRow(stmt, args...).Scan(&job.ID, &job.Status, &job.FileID, &job.CreatedAt, &job.UpdatedAt)
+	if err != nil {
+		return nil, fmt.Errorf("failed to get transcribe job: %w", err)
+	}
+
+	return &job, nil
+}
diff --git a/go.mod b/go.mod
new file mode 100644
index 0000000..4ac26fd
--- /dev/null
+++ b/go.mod
@@ -0,0 +1,40 @@
+module git.vakhrushev.me/av/transcriber
+
+go 1.24.5
+
+require (
+	github.com/doug-martin/goqu/v9 v9.19.0
+	github.com/gin-gonic/gin v1.10.1
+	github.com/google/uuid v1.4.0
+	github.com/mattn/go-sqlite3 v1.14.17
+	github.com/pressly/goose/v3 v3.15.1
+)
+
+require (
+	github.com/bytedance/sonic v1.11.6 // indirect
+	github.com/bytedance/sonic/loader v0.1.1 // indirect
+	github.com/cloudwego/base64x v0.1.4 // indirect
+
github.com/cloudwego/iasm v0.2.0 // indirect + github.com/gabriel-vasile/mimetype v1.4.3 // indirect + github.com/gin-contrib/sse v0.1.0 // indirect + github.com/go-playground/locales v0.14.1 // indirect + github.com/go-playground/universal-translator v0.18.1 // indirect + github.com/go-playground/validator/v10 v10.20.0 // indirect + github.com/goccy/go-json v0.10.2 // indirect + github.com/json-iterator/go v1.1.12 // indirect + github.com/klauspost/cpuid/v2 v2.2.7 // indirect + github.com/leodido/go-urn v1.4.0 // indirect + github.com/mattn/go-isatty v0.0.20 // indirect + github.com/modern-go/concurrent v0.0.0-20180306012644-bacd9c7ef1dd // indirect + github.com/modern-go/reflect2 v1.0.2 // indirect + github.com/pelletier/go-toml/v2 v2.2.2 // indirect + github.com/twitchyliquid64/golang-asm v0.15.1 // indirect + github.com/ugorji/go/codec v1.2.12 // indirect + golang.org/x/arch v0.8.0 // indirect + golang.org/x/crypto v0.23.0 // indirect + golang.org/x/net v0.25.0 // indirect + golang.org/x/sys v0.20.0 // indirect + golang.org/x/text v0.15.0 // indirect + google.golang.org/protobuf v1.34.1 // indirect + gopkg.in/yaml.v3 v3.0.1 // indirect +) diff --git a/go.sum b/go.sum new file mode 100644 index 0000000..9d8df83 --- /dev/null +++ b/go.sum @@ -0,0 +1,144 @@ +github.com/DATA-DOG/go-sqlmock v1.5.0 h1:Shsta01QNfFxHCfpW6YH2STWB0MudeXXEWMr20OEh60= +github.com/DATA-DOG/go-sqlmock v1.5.0/go.mod h1:f/Ixk793poVmq4qj/V1dPUg2JEAKC73Q5eFN3EC/SaM= +github.com/bytedance/sonic v1.11.6 h1:oUp34TzMlL+OY1OUWxHqsdkgC/Zfc85zGqw9siXjrc0= +github.com/bytedance/sonic v1.11.6/go.mod h1:LysEHSvpvDySVdC2f87zGWf6CIKJcAvqab1ZaiQtds4= +github.com/bytedance/sonic/loader v0.1.1 h1:c+e5Pt1k/cy5wMveRDyk2X4B9hF4g7an8N3zCYjJFNM= +github.com/bytedance/sonic/loader v0.1.1/go.mod h1:ncP89zfokxS5LZrJxl5z0UJcsk4M4yY2JpfqGeCtNLU= +github.com/cloudwego/base64x v0.1.4 h1:jwCgWpFanWmN8xoIUHa2rtzmkd5J2plF/dnLS6Xd/0Y= +github.com/cloudwego/base64x v0.1.4/go.mod h1:0zlkT4Wn5C6NdauXdJRhSKRlJvmclQ1hhJgA0rcu/8w= 
+github.com/cloudwego/iasm v0.2.0 h1:1KNIy1I1H9hNNFEEH3DVnI4UujN+1zjpuk6gwHLTssg= +github.com/cloudwego/iasm v0.2.0/go.mod h1:8rXZaNYT2n95jn+zTI1sDr+IgcD2GVs0nlbbQPiEFhY= +github.com/davecgh/go-spew v1.1.0/go.mod h1:J7Y8YcW2NihsgmVo/mv3lAwl/skON4iLHjSsI+c5H38= +github.com/davecgh/go-spew v1.1.1 h1:vj9j/u1bqnvCEfJOwUhtlOARqs3+rkHYY13jYWTU97c= +github.com/davecgh/go-spew v1.1.1/go.mod h1:J7Y8YcW2NihsgmVo/mv3lAwl/skON4iLHjSsI+c5H38= +github.com/denisenkom/go-mssqldb v0.10.0/go.mod h1:xbL0rPBG9cCiLr28tMa8zpbdarY27NDyej4t/EjAShU= +github.com/doug-martin/goqu/v9 v9.19.0 h1:PD7t1X3tRcUiSdc5TEyOFKujZA5gs3VSA7wxSvBx7qo= +github.com/doug-martin/goqu/v9 v9.19.0/go.mod h1:nf0Wc2/hV3gYK9LiyqIrzBEVGlI8qW3GuDCEobC4wBQ= +github.com/dustin/go-humanize v1.0.1 h1:GzkhY7T5VNhEkwH0PVJgjz+fX1rhBrR7pRT3mDkpeCY= +github.com/dustin/go-humanize v1.0.1/go.mod h1:Mu1zIs6XwVuF/gI1OepvI0qD18qycQx+mFykh5fBlto= +github.com/gabriel-vasile/mimetype v1.4.3 h1:in2uUcidCuFcDKtdcBxlR0rJ1+fsokWf+uqxgUFjbI0= +github.com/gabriel-vasile/mimetype v1.4.3/go.mod h1:d8uq/6HKRL6CGdk+aubisF/M5GcPfT7nKyLpA0lbSSk= +github.com/gin-contrib/sse v0.1.0 h1:Y/yl/+YNO8GZSjAhjMsSuLt29uWRFHdHYUb5lYOV9qE= +github.com/gin-contrib/sse v0.1.0/go.mod h1:RHrZQHXnP2xjPF+u1gW/2HnVO7nvIa9PG3Gm+fLHvGI= +github.com/gin-gonic/gin v1.10.1 h1:T0ujvqyCSqRopADpgPgiTT63DUQVSfojyME59Ei63pQ= +github.com/gin-gonic/gin v1.10.1/go.mod h1:4PMNQiOhvDRa013RKVbsiNwoyezlm2rm0uX/T7kzp5Y= +github.com/go-playground/assert/v2 v2.2.0 h1:JvknZsQTYeFEAhQwI4qEt9cyV5ONwRHC+lYKSsYSR8s= +github.com/go-playground/assert/v2 v2.2.0/go.mod h1:VDjEfimB/XKnb+ZQfWdccd7VUvScMdVu0Titje2rxJ4= +github.com/go-playground/locales v0.14.1 h1:EWaQ/wswjilfKLTECiXz7Rh+3BjFhfDFKv/oXslEjJA= +github.com/go-playground/locales v0.14.1/go.mod h1:hxrqLVvrK65+Rwrd5Fc6F2O76J/NuW9t0sjnWqG1slY= +github.com/go-playground/universal-translator v0.18.1 h1:Bcnm0ZwsGyWbCzImXv+pAJnYK9S473LQFuzCbDbfSFY= +github.com/go-playground/universal-translator v0.18.1/go.mod 
h1:xekY+UJKNuX9WP91TpwSH2VMlDf28Uj24BCp08ZFTUY= +github.com/go-playground/validator/v10 v10.20.0 h1:K9ISHbSaI0lyB2eWMPJo+kOS/FBExVwjEviJTixqxL8= +github.com/go-playground/validator/v10 v10.20.0/go.mod h1:dbuPbCMFw/DrkbEynArYaCwl3amGuJotoKCe95atGMM= +github.com/go-sql-driver/mysql v1.6.0/go.mod h1:DCzpHaOWr8IXmIStZouvnhqoel9Qv2LBy8hT2VhHyBg= +github.com/goccy/go-json v0.10.2 h1:CrxCmQqYDkv1z7lO7Wbh2HN93uovUHgrECaO5ZrCXAU= +github.com/goccy/go-json v0.10.2/go.mod h1:6MelG93GURQebXPDq3khkgXZkazVtN9CRI+MGFi0w8I= +github.com/golang-sql/civil v0.0.0-20190719163853-cb61b32ac6fe/go.mod h1:8vg3r2VgvsThLBIFL93Qb5yWzgyZWhEmBwUJWevAkK0= +github.com/google/go-cmp v0.5.5 h1:Khx7svrCpmxxtHBq5j2mp/xVjsi8hQMfNLvJFAlrGgU= +github.com/google/go-cmp v0.5.5/go.mod h1:v8dTdLbMG2kIc/vJvl+f65V22dbkXbowE6jgT/gNBxE= +github.com/google/gofuzz v1.0.0/go.mod h1:dBl0BpW6vV/+mYPU4Po3pmUjxk6FQPldtuIdl/M65Eg= +github.com/google/uuid v1.4.0 h1:MtMxsa51/r9yyhkyLsVeVt0B+BGQZzpQiTQ4eHZ8bc4= +github.com/google/uuid v1.4.0/go.mod h1:TIyPZe4MgqvfeYDBFedMoGGpEw/LqOeaOT+nhxU+yHo= +github.com/json-iterator/go v1.1.12 h1:PV8peI4a0ysnczrg+LtxykD8LfKY9ML6u2jnxaEnrnM= +github.com/json-iterator/go v1.1.12/go.mod h1:e30LSqwooZae/UwlEbR2852Gd8hjQvJoHmT4TnhNGBo= +github.com/kballard/go-shellquote v0.0.0-20180428030007-95032a82bc51 h1:Z9n2FFNUXsshfwJMBgNA0RU6/i7WVaAegv3PtuIHPMs= +github.com/kballard/go-shellquote v0.0.0-20180428030007-95032a82bc51/go.mod h1:CzGEWj7cYgsdH8dAjBGEr58BoE7ScuLd+fwFZ44+/x8= +github.com/klauspost/cpuid/v2 v2.0.9/go.mod h1:FInQzS24/EEf25PyTYn52gqo7WaD8xa0213Md/qVLRg= +github.com/klauspost/cpuid/v2 v2.2.7 h1:ZWSB3igEs+d0qvnxR/ZBzXVmxkgt8DdzP6m9pfuVLDM= +github.com/klauspost/cpuid/v2 v2.2.7/go.mod h1:Lcz8mBdAVJIBVzewtcLocK12l3Y+JytZYpaMropDUws= +github.com/knz/go-libedit v1.10.1/go.mod h1:MZTVkCWyz0oBc7JOWP3wNAzd002ZbM/5hgShxwh4x8M= +github.com/leodido/go-urn v1.4.0 h1:WT9HwE9SGECu3lg4d/dIA+jxlljEa1/ffXKmRjqdmIQ= +github.com/leodido/go-urn v1.4.0/go.mod 
h1:bvxc+MVxLKB4z00jd1z+Dvzr47oO32F/QSNjSBOlFxI= +github.com/lib/pq v1.10.1/go.mod h1:AlVN5x4E4T544tWzH6hKfbfQvm3HdbOxrmggDNAPY9o= +github.com/lib/pq v1.10.9 h1:YXG7RB+JIjhP29X+OtkiDnYaXQwpS4JEWq7dtCCRUEw= +github.com/lib/pq v1.10.9/go.mod h1:AlVN5x4E4T544tWzH6hKfbfQvm3HdbOxrmggDNAPY9o= +github.com/mattn/go-isatty v0.0.20 h1:xfD0iDuEKnDkl03q4limB+vH+GxLEtL/jb4xVJSWWEY= +github.com/mattn/go-isatty v0.0.20/go.mod h1:W+V8PltTTMOvKvAeJH7IuucS94S2C6jfK/D7dTCTo3Y= +github.com/mattn/go-sqlite3 v1.14.7/go.mod h1:NyWgC/yNuGj7Q9rpYnZvas74GogHl5/Z4A/KQRfk6bU= +github.com/mattn/go-sqlite3 v1.14.17 h1:mCRHCLDUBXgpKAqIKsaAaAsrAlbkeomtRFKXh2L6YIM= +github.com/mattn/go-sqlite3 v1.14.17/go.mod h1:2eHXhiwb8IkHr+BDWZGa96P6+rkvnG63S2DGjv9HUNg= +github.com/modern-go/concurrent v0.0.0-20180228061459-e0a39a4cb421/go.mod h1:6dJC0mAP4ikYIbvyc7fijjWJddQyLn8Ig3JB5CqoB9Q= +github.com/modern-go/concurrent v0.0.0-20180306012644-bacd9c7ef1dd h1:TRLaZ9cD/w8PVh93nsPXa1VrQ6jlwL5oN8l14QlcNfg= +github.com/modern-go/concurrent v0.0.0-20180306012644-bacd9c7ef1dd/go.mod h1:6dJC0mAP4ikYIbvyc7fijjWJddQyLn8Ig3JB5CqoB9Q= +github.com/modern-go/reflect2 v1.0.2 h1:xBagoLtFs94CBntxluKeaWgTMpvLxC4ur3nMaC9Gz0M= +github.com/modern-go/reflect2 v1.0.2/go.mod h1:yWuevngMOJpCy52FWWMvUC8ws7m/LJsjYzDa0/r8luk= +github.com/pelletier/go-toml/v2 v2.2.2 h1:aYUidT7k73Pcl9nb2gScu7NSrKCSHIDE89b3+6Wq+LM= +github.com/pelletier/go-toml/v2 v2.2.2/go.mod h1:1t835xjRzz80PqgE6HHgN2JOsmgYu/h4qDAS4n929Rs= +github.com/pmezard/go-difflib v1.0.0 h1:4DBwDE0NGyQoBHbLQYPwSUPoCMWR5BEzIk/f1lZbAQM= +github.com/pmezard/go-difflib v1.0.0/go.mod h1:iKH77koFhYxTK1pcRnkKkqfTogsbg7gZNVY4sRDYZ/4= +github.com/pressly/goose/v3 v3.15.1 h1:dKaJ1SdLvS/+HtS8PzFT0KBEtICC1jewLXM+b3emlv8= +github.com/pressly/goose/v3 v3.15.1/go.mod h1:0E3Yg/+EwYzO6Rz2P98MlClFgIcoujbVRs575yi3iIM= +github.com/remyoudompheng/bigfft v0.0.0-20230129092748-24d4a6f8daec h1:W09IVJc94icq4NjY3clb7Lk8O1qJ8BdBEF8z0ibU0rE= +github.com/remyoudompheng/bigfft 
v0.0.0-20230129092748-24d4a6f8daec/go.mod h1:qqbHyh8v60DhA7CoWK5oRCqLrMHRGoxYCSS9EjAz6Eo= +github.com/stretchr/objx v0.1.0/go.mod h1:HFkY916IF+rwdDfMAkV7OtwuqBVzrE8GR6GFx+wExME= +github.com/stretchr/objx v0.4.0/go.mod h1:YvHI0jy2hoMjB+UWwv71VJQ9isScKT/TqJzVSSt89Yw= +github.com/stretchr/objx v0.5.0/go.mod h1:Yh+to48EsGEfYuaHDzXPcE3xhTkx73EhmCGUpEOglKo= +github.com/stretchr/objx v0.5.2 h1:xuMeJ0Sdp5ZMRXx/aWO6RZxdr3beISkG5/G/aIRr3pY= +github.com/stretchr/objx v0.5.2/go.mod h1:FRsXN1f5AsAjCGJKqEizvkpNtU+EGNCLh3NxZ/8L+MA= +github.com/stretchr/testify v1.3.0/go.mod h1:M5WIy9Dh21IEIfnGCwXGc5bZfKNJtfHm1UVUgZn+9EI= +github.com/stretchr/testify v1.7.0/go.mod h1:6Fq8oRcR53rry900zMqJjRRixrwX3KX962/h/Wwjteg= +github.com/stretchr/testify v1.7.1/go.mod h1:6Fq8oRcR53rry900zMqJjRRixrwX3KX962/h/Wwjteg= +github.com/stretchr/testify v1.8.0/go.mod h1:yNjHg4UonilssWZ8iaSj1OCr/vHnekPRkoO+kdMU+MU= +github.com/stretchr/testify v1.8.1/go.mod h1:w2LPCIKwWwSfY2zedu0+kehJoqGctiVI29o6fzry7u4= +github.com/stretchr/testify v1.8.4/go.mod h1:sz/lmYIOXD/1dqDmKjjqLyZ2RngseejIcXlSw2iwfAo= +github.com/stretchr/testify v1.9.0 h1:HtqpIVDClZ4nwg75+f6Lvsy/wHu+3BoSGCbBAcpTsTg= +github.com/stretchr/testify v1.9.0/go.mod h1:r2ic/lqez/lEtzL7wO/rwa5dbSLXVDPFyf8C91i36aY= +github.com/twitchyliquid64/golang-asm v0.15.1 h1:SU5vSMR7hnwNxj24w34ZyCi/FmDZTkS4MhqMhdFk5YI= +github.com/twitchyliquid64/golang-asm v0.15.1/go.mod h1:a1lVb/DtPvCB8fslRZhAngC2+aY1QWCk3Cedj/Gdt08= +github.com/ugorji/go/codec v1.2.12 h1:9LC83zGrHhuUA9l16C9AHXAqEV/2wBQ4nkvumAE65EE= +github.com/ugorji/go/codec v1.2.12/go.mod h1:UNopzCgEMSXjBc6AOMqYvWC1ktqTAfzJZUZgYf6w6lg= +golang.org/x/arch v0.0.0-20210923205945-b76863e36670/go.mod h1:5om86z9Hs0C8fWVUuoMHwpExlXzs5Tkyp9hOrfG7pp8= +golang.org/x/arch v0.8.0 h1:3wRIsP3pM4yUptoR96otTUOXI367OS0+c9eeRi9doIc= +golang.org/x/arch v0.8.0/go.mod h1:FEVrYAQjsQXMVJ1nsMoVVXPZg6p2JE2mx8psSWTDQys= +golang.org/x/crypto v0.0.0-20190308221718-c2843e01d9a2/go.mod h1:djNgcEr1/C05ACkg1iLfiJU5Ep61QUkGW8qpdssI0+w= 
+golang.org/x/crypto v0.0.0-20190325154230-a5d413f7728c/go.mod h1:djNgcEr1/C05ACkg1iLfiJU5Ep61QUkGW8qpdssI0+w= +golang.org/x/crypto v0.0.0-20190605123033-f99c8df09eb5/go.mod h1:yigFU9vqHzYiE8UmvKecakEJjdnWj3jj499lnFckfCI= +golang.org/x/crypto v0.23.0 h1:dIJU/v2J8Mdglj/8rJ6UUOM3Zc9zLZxVZwwxMooUSAI= +golang.org/x/crypto v0.23.0/go.mod h1:CKFgDieR+mRhux2Lsu27y0fO304Db0wZe70UKqHu0v8= +golang.org/x/mod v0.12.0 h1:rmsUpXtvNzj340zd98LZ4KntptpfRHwpFOHG188oHXc= +golang.org/x/mod v0.12.0/go.mod h1:iBbtSCu2XBx23ZKBPSOrRkjjQPZFPuis4dIYUhu/chs= +golang.org/x/net v0.0.0-20190404232315-eb5bcb51f2a3/go.mod h1:t9HGtf8HONx5eT2rtn7q6eTqICYqUVnKs3thJo3Qplg= +golang.org/x/net v0.25.0 h1:d/OCCoBEUq33pjydKrGQhw7IlUPI2Oylr+8qLx49kac= +golang.org/x/net v0.25.0/go.mod h1:JkAGAh7GEvH74S6FOH42FLoXpXbE/aqXSrIQjXgsiwM= +golang.org/x/sys v0.0.0-20190215142949-d0b11bdaac8a/go.mod h1:STP8DvDyc/dI5b8T5hshtkjS+E42TnysNCUPdjciGhY= +golang.org/x/sys v0.0.0-20190412213103-97732733099d/go.mod h1:h1NjWce9XRLGQEsW7wpKNCjG9DtNlClVuFLEZdDNbEs= +golang.org/x/sys v0.5.0/go.mod h1:oPkhp1MJrh7nUepCBck5+mAzfO9JrbApNNgaTdGDITg= +golang.org/x/sys v0.6.0/go.mod h1:oPkhp1MJrh7nUepCBck5+mAzfO9JrbApNNgaTdGDITg= +golang.org/x/sys v0.20.0 h1:Od9JTbYCk261bKm4M/mw7AklTlFYIa0bIp9BgSm1S8Y= +golang.org/x/sys v0.20.0/go.mod h1:/VUhepiaJMQUp4+oa/7Zr1D23ma6VTLIYjOOTFZPUcA= +golang.org/x/text v0.3.0/go.mod h1:NqM8EUOU14njkJ3fqMW+pc6Ldnwhi/IjpwHt7yyuwOQ= +golang.org/x/text v0.15.0 h1:h1V/4gjBv8v9cjcR6+AR5+/cIYK5N/WAgiv4xlsEtAk= +golang.org/x/text v0.15.0/go.mod h1:18ZOQIKpY8NJVqYksKHtTdi31H5itFRjB5/qKTNYzSU= +golang.org/x/tools v0.13.0 h1:Iey4qkscZuv0VvIt8E0neZjtPVQFSc870HQ448QgEmQ= +golang.org/x/tools v0.13.0/go.mod h1:HvlwmtVNQAhOuCjW7xxvovg8wbNq7LwfXh/k7wXUl58= +golang.org/x/xerrors v0.0.0-20191204190536-9bdfabe68543 h1:E7g+9GITq07hpfrRu66IVDexMakfv52eLZ2CXBWiKr4= +golang.org/x/xerrors v0.0.0-20191204190536-9bdfabe68543/go.mod h1:I/5z698sn9Ka8TeJc9MKroUUfqBBauWjQqLJ2OPfmY0= +google.golang.org/protobuf v1.34.1 
h1:9ddQBjfCyZPOHPUiPxpYESBLc+T8P3E+Vo4IbKZgFWg= +google.golang.org/protobuf v1.34.1/go.mod h1:c6P6GXX6sHbq/GpV6MGZEdwhWPcYBgnhAHhKbcUYpos= +gopkg.in/check.v1 v0.0.0-20161208181325-20d25e280405 h1:yhCVgyC4o1eVCa2tZl7eS0r+SDo693bJlVdllGtEeKM= +gopkg.in/check.v1 v0.0.0-20161208181325-20d25e280405/go.mod h1:Co6ibVJAznAaIkqp8huTwlJQCZ016jof/cbN4VW5Yz0= +gopkg.in/yaml.v3 v3.0.0-20200313102051-9f266ea9e77c/go.mod h1:K4uyk7z7BCEPqu6E+C64Yfv1cQ7kz7rIZviUmN+EgEM= +gopkg.in/yaml.v3 v3.0.1 h1:fxVm/GzAzEWqLHuvctI91KS9hhNmmWOoWu0XTYJS7CA= +gopkg.in/yaml.v3 v3.0.1/go.mod h1:K4uyk7z7BCEPqu6E+C64Yfv1cQ7kz7rIZviUmN+EgEM= +lukechampine.com/uint128 v1.3.0 h1:cDdUVfRwDUDovz610ABgFD17nXD4/uDgVHl2sC3+sbo= +lukechampine.com/uint128 v1.3.0/go.mod h1:c4eWIwlEGaxC/+H1VguhU4PHXNWDCDMUlWdIWl2j1gk= +modernc.org/cc/v3 v3.41.0 h1:QoR1Sn3YWlmA1T4vLaKZfawdVtSiGx8H+cEojbC7v1Q= +modernc.org/cc/v3 v3.41.0/go.mod h1:Ni4zjJYJ04CDOhG7dn640WGfwBzfE0ecX8TyMB0Fv0Y= +modernc.org/ccgo/v3 v3.16.15 h1:KbDR3ZAVU+wiLyMESPtbtE/Add4elztFyfsWoNTgxS0= +modernc.org/ccgo/v3 v3.16.15/go.mod h1:yT7B+/E2m43tmMOT51GMoM98/MtHIcQQSleGnddkUNI= +modernc.org/libc v1.24.1 h1:uvJSeCKL/AgzBo2yYIPPTy82v21KgGnizcGYfBHaNuM= +modernc.org/libc v1.24.1/go.mod h1:FmfO1RLrU3MHJfyi9eYYmZBfi/R+tqZ6+hQ3yQQUkak= +modernc.org/mathutil v1.6.0 h1:fRe9+AmYlaej+64JsEEhoWuAYBkOtQiMEU7n/XgfYi4= +modernc.org/mathutil v1.6.0/go.mod h1:Ui5Q9q1TR2gFm0AQRqQUaBWFLAhQpCwNcuhBOSedWPo= +modernc.org/memory v1.7.2 h1:Klh90S215mmH8c9gO98QxQFsY+W451E8AnzjoE2ee1E= +modernc.org/memory v1.7.2/go.mod h1:NO4NVCQy0N7ln+T9ngWqOQfi7ley4vpwvARR+Hjw95E= +modernc.org/opt v0.1.3 h1:3XOZf2yznlhC+ibLltsDGzABUGVx8J6pnFMS3E4dcq4= +modernc.org/opt v0.1.3/go.mod h1:WdSiB5evDcignE70guQKxYUl14mgWtbClRi5wmkkTX0= +modernc.org/sqlite v1.26.0 h1:SocQdLRSYlA8W99V8YH0NES75thx19d9sB/aFc4R8Lw= +modernc.org/sqlite v1.26.0/go.mod h1:FL3pVXie73rg3Rii6V/u5BoHlSoyeZeIgKZEgHARyCU= +modernc.org/strutil v1.2.0 h1:agBi9dp1I+eOnxXeiZawM8F4LawKv4NzGWSaLfyeNZA= +modernc.org/strutil v1.2.0/go.mod 
h1:/mdcBmfOibveCTBxUl5B5l6W+TTH1FXPLHZE6bTosX0=
+modernc.org/token v1.1.0 h1:Xl7Ap9dKaEs5kLoOQeQmPWevfnk/DM5qcLcYlA8ys6Y=
+modernc.org/token v1.1.0/go.mod h1:UGzOrNV1mAFSEB63lOFHIpNRUVMvYTc6yu1SMY/XTDM=
+nullprogram.com/x/optparse v1.0.0/go.mod h1:KdyPE+Igbe0jQUrVfMqDMeJQIJZEuyV7pjYmp6pbG50=
+rsc.io/pdf v0.1.1/go.mod h1:n8OzWcQ6Sp37PL01nO98y4iUCRdTGarVfzxY20ICaU4=
diff --git a/handlers/transcribe.go b/handlers/transcribe.go
new file mode 100644
index 0000000..a71a148
--- /dev/null
+++ b/handlers/transcribe.go
@@ -0,0 +1,135 @@
+package handlers
+
+import (
+	"database/sql"
+	"errors"
+	"fmt"
+	"io"
+	"net/http"
+	"os"
+	"path/filepath"
+	"time"
+
+	"git.vakhrushev.me/av/transcriber/database"
+	"git.vakhrushev.me/av/transcriber/models"
+	"github.com/gin-gonic/gin"
+	"github.com/google/uuid"
+)
+
+// TranscribeHandler serves the transcription HTTP endpoints on top of db.
+type TranscribeHandler struct {
+	db *database.DB
+}
+
+// NewTranscribeHandler returns a TranscribeHandler that stores its data in db.
+func NewTranscribeHandler(db *database.DB) *TranscribeHandler {
+	return &TranscribeHandler{db: db}
+}
+
+// TranscribeResponse is the JSON body returned after a successful upload.
+type TranscribeResponse struct {
+	JobID  string `json:"job_id"`
+	FileID string `json:"file_id"`
+	Status string `json:"status"`
+}
+
+// UploadAndTranscribe stores the uploaded "audio" form file under data/files,
+// records it in the files table and creates a pending transcribe job for it.
+// It replies 201 with a TranscribeResponse, 400 when the form file is missing
+// and 500 when saving the file or writing either database record fails.
+func (h *TranscribeHandler) UploadAndTranscribe(c *gin.Context) {
+	// Read the uploaded file from the multipart form.
+	file, header, err := c.Request.FormFile("audio")
+	if err != nil {
+		c.JSON(http.StatusBadRequest, gin.H{"error": "No audio file provided"})
+		return
+	}
+	defer file.Close()
+
+	// A fresh UUID names the stored file and identifies it in the database.
+	fileID := uuid.New().String()
+
+	// Keep the uploaded name's extension; fall back to ".audio" when it has none.
+	ext := filepath.Ext(header.Filename)
+	if ext == "" {
+		ext = ".audio"
+	}
+
+	fileName := fmt.Sprintf("%s%s", fileID, ext)
+	filePath := filepath.Join("data", "files", fileName)
+
+	dst, err := os.Create(filePath)
+	if err != nil {
+		c.JSON(http.StatusInternalServerError, gin.H{"error": "Failed to create file"})
+		return
+	}
+
+	// Close explicitly instead of deferring: Close can report a write error,
+	// and that has to count as a failed save.
+	size, err := io.Copy(dst, file)
+	if closeErr := dst.Close(); err == nil {
+		err = closeErr
+	}
+	if err != nil {
+		// Best effort: do not leave a truncated upload behind.
+		_ = os.Remove(filePath)
+		c.JSON(http.StatusInternalServerError, gin.H{"error": "Failed to save file"})
+		return
+	}
+
+	// One timestamp for both records keeps their creation times identical.
+	now := time.Now()
+
+	fileRecord := &models.File{
+		ID:        fileID,
+		Type:      header.Header.Get("Content-Type"),
+		Size:      size,
+		CreatedAt: now,
+	}
+
+	if err := h.db.CreateFile(fileRecord); err != nil {
+		// Best effort: without a database record nothing refers to the file.
+		_ = os.Remove(filePath)
+		c.JSON(http.StatusInternalServerError, gin.H{"error": "Failed to save file record"})
+		return
+	}
+
+	jobID := uuid.New().String()
+	job := &models.TranscribeJob{
+		ID:        jobID,
+		Status:    models.StatusPending,
+		FileID:    fileID,
+		CreatedAt: now,
+		UpdatedAt: now,
+	}
+
+	if err := h.db.CreateTranscribeJob(job); err != nil {
+		// NOTE: the stored file and its files row are left in place here, so
+		// they stay consistent with each other although no job refers to them.
+		c.JSON(http.StatusInternalServerError, gin.H{"error": "Failed to create transcribe job"})
+		return
+	}
+
+	c.JSON(http.StatusCreated, TranscribeResponse{
+		JobID:  jobID,
+		FileID: fileID,
+		Status: models.StatusPending,
+	})
+}
+
+// GetJobStatus replies with the transcribe job identified by the ":id" path
+// parameter: 200 with the job, 404 when no such job exists and 500 when the
+// lookup itself fails.
+func (h *TranscribeHandler) GetJobStatus(c *gin.Context) {
+	jobID := c.Param("id")
+
+	job, err := h.db.GetTranscribeJobByID(jobID)
+	switch {
+	case errors.Is(err, sql.ErrNoRows):
+		c.JSON(http.StatusNotFound, gin.H{"error": "Job not found"})
+	case err != nil:
+		c.JSON(http.StatusInternalServerError, gin.H{"error": "Failed to get job"})
+	default:
+		c.JSON(http.StatusOK, job)
+	}
+}
diff --git a/main.go b/main.go
new file mode 100644
index 0000000..09d29db
--- /dev/null
+++ b/main.go
@@ -0,0 +1,62 @@
+package main
+
+import (
+	"log"
+	"os"
+
+	"git.vakhrushev.me/av/transcriber/database"
+	"git.vakhrushev.me/av/transcriber/handlers"
+	"github.com/gin-gonic/gin"
+)
+
+// main prepares the storage directory and the database, registers the HTTP
+// routes and serves them on port 8080.
+func main() {
+	// Make sure the upload directory exists.
+	if err := os.MkdirAll("data/files", 0755); err != nil {
+		log.Fatal("Failed to create data/files directory:", err)
+	}
+
+	// Open the database.
+	db, err := database.New("data/transcriber.db")
+	if err != nil {
+		log.Fatal("Failed to initialize database:", err)
+	}
+	defer db.Close()
+
+	// Apply pending migrations.
+	if err := db.RunMigrations("migrations"); err != nil {
+		log.Fatal("Failed to run migrations:", err)
+	}
+
+	// Create the Gin router.
+	r := gin.Default()
+
+	// Set up the handlers.
+	transcribeHandler := handlers.NewTranscribeHandler(db)
+
+	// Register the API routes.
+	api := r.Group("/api")
+	{
+		api.POST("/transcribe", transcribeHandler.UploadAndTranscribe)
+		api.GET("/transcribe/:id", transcribeHandler.GetJobStatus)
+	}
+
+	// Not a middleware and not an upload size limit: per the gin documentation
+	// this is the maxMemory value gin passes to ParseMultipartForm.
+	// NOTE(review): UploadAndTranscribe calls c.Request.FormFile directly, which presumably bypasses this setting; confirm.
+	r.MaxMultipartMemory = 32 << 20 // 32 MiB
+
+	// Health-check route.
+	r.GET("/health", func(c *gin.Context) {
+		c.JSON(200, gin.H{
+			"status":  "ok",
+			"message": "Transcriber service is running",
+		})
+	})
+
+	log.Println("Starting server on :8080")
+	if err := r.Run(":8080"); err != nil {
+		log.Fatal("Failed to start server:", err)
+	}
+}
diff --git a/migrations/001_create_files_table.sql b/migrations/001_create_files_table.sql
new file mode 100644
index 0000000..dbef4fb
--- /dev/null
+++ b/migrations/001_create_files_table.sql
@@ -0,0 +1,10 @@
+-- +goose Up
+CREATE TABLE files (
+    id TEXT PRIMARY KEY,
+    type TEXT NOT NULL,
+    size INTEGER NOT NULL,
+    created_at DATETIME DEFAULT CURRENT_TIMESTAMP
+);
+
+-- +goose Down
+DROP TABLE files;
diff --git a/migrations/002_create_transcribe_jobs_table.sql b/migrations/002_create_transcribe_jobs_table.sql
new file mode 100644
index 0000000..bdbe8e1
--- /dev/null
+++ b/migrations/002_create_transcribe_jobs_table.sql
@@ -0,0 +1,12 @@
+-- +goose Up
+CREATE TABLE transcribe_jobs (
+    id TEXT PRIMARY KEY,
+    status TEXT NOT NULL DEFAULT 'pending',
+    file_id TEXT NOT NULL,
+    created_at DATETIME DEFAULT CURRENT_TIMESTAMP,
+    updated_at DATETIME DEFAULT CURRENT_TIMESTAMP,
+    FOREIGN KEY (file_id) REFERENCES files(id)
+);
+
+-- +goose Down
+DROP TABLE transcribe_jobs;
diff --git a/models/models.go b/models/models.go
new file mode 100644
index 0000000..e9d669d
--- /dev/null
+++ b/models/models.go
@@ -0,0 +1,30 @@
+package models
+
+import (
+	"time"
+)
+
+// File is a row of the files table describing one uploaded file.
+type File struct {
+	ID        string    `db:"id" json:"id"`
+	Type      string    `db:"type" json:"type"`
+	Size      int64     `db:"size" json:"size"`
+	CreatedAt time.Time `db:"created_at" json:"created_at"`
+}
+
+// TranscribeJob is a row of the transcribe_jobs table.
+type TranscribeJob struct {
+	ID        string    `db:"id" json:"id"`
+	Status    string    `db:"status" json:"status"`
+	FileID    string    `db:"file_id" json:"file_id"`
+	CreatedAt time.Time `db:"created_at" json:"created_at"`
+	UpdatedAt time.Time `db:"updated_at" json:"updated_at"`
+}
+
+// Values stored in TranscribeJob.Status.
+const (
+	StatusPending    = "pending"
+	StatusProcessing = "processing"
+	StatusCompleted  = "completed"
+	StatusFailed     = "failed"
+)