-
Notifications
You must be signed in to change notification settings - Fork 7
/
manifest.yaml
74 lines (74 loc) · 1.96 KB
/
manifest.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
# You can edit this file at editor.swagger.io.
# Swagger (OpenAPI) 2.0 document; the version is quoted so it stays a string.
swagger: '2.0'

# Service metadata. Keys prefixed with "x-21-" are vendor-extension fields.
info:
  # Not filled in for this manifest; written as explicit nulls rather than
  # bare empty values so the intent is unambiguous.
  x-21-github-profile-url: null
  x-21-github-project-url: null
  title: OCR to Speech
  description: >-
    Performs OCR on an image to extract text, translate, and produce an
    audio clip.
  termsOfService: https://opensource.org/licenses/MIT
  x-21-usage: ''
  # Example invocation followed by an installation hint. Kept as a literal
  # block (two lines, no trailing newline) instead of one long escaped string.
  x-21-quick-buy: |-
    $ 21 buy http://<ZEROTIER IP>:6005/ocr2speech21?image_url=http://i.imgur.com/8nVmA6t.jpg --maxprice 20000 | jq -r '.data' | base64 --decode > output.wav
    # Note: run `sudo apt-get install jq` or `brew install jq` for Mac if jq is not already installed.
  x-21-category: Utilities
  x-21-app-image: ''
  # Minimum and maximum are identical, i.e. a single fixed price.
  x-21-total-price:
    min: 15000
    max: 15000
  contact:
    name: Satoshi Nakamoto
    # NOTE(review): the address appears to have been redacted in this copy of
    # the file. It is quoted because an unquoted value starting with "[" is
    # parsed as a YAML flow sequence, not a string. Restore the real address.
    email: '[email protected]'
  license:
    name: MIT LICENSE
    url: https://opensource.org/licenses/MIT
  x-21-keywords:
    - translation
    - audio
    - text
    - image
    - ocr
  # Quoted so the version is a string, not the float 0.1.
  version: '0.1'
# Where the service is reached. The host value looks like a template
# placeholder (to be replaced with a real address); it is quoted so the angle
# brackets, embedded space and colon are read as one plain string.
host: '<ZEROTIER IP>:6005'
schemes:
  - http
basePath: /

# Vendor-extension fields giving the manifest and health-check paths.
x-21-manifest-path: /manifest
x-21-healthcheck-path: /healthy
# API operations exposed by the service.
paths:
  /ocr2speech21:
    get:
      summary: Get an audio file reading text found in an image
      produces:
        - application/json
      parameters:
        # Declared as the query parameter "image_url": the usage example in
        # info.x-21-quick-buy calls this GET endpoint with ?image_url=<url>,
        # whereas a body parameter is not something a GET client can
        # reliably send.
        # NOTE(review): confirm against the server handler that the value is
        # read from the query string.
        - name: image_url
          in: query
          description: URL of the image to process.
          required: true
          type: string
      responses:
        # Status codes are quoted so the keys are strings, not integers.
        '200':
          description: Audio file (base64 encoded)
          schema:
            type: object
            properties:
              # Holds the audio payload as a string.
              data:
                type: string
        '400':
          description: Invalid input.
          schema:
            $ref: '#/definitions/InvalidInput'
        '500':
          description: Error processing request.
          schema:
            $ref: '#/definitions/ProcessingError'
# Reusable response schemas referenced from the operations via $ref.
# Both error shapes are the same: an object with a single string "error" field.
definitions:
  # Referenced by the 400 response.
  InvalidInput:
    type: object
    properties:
      error:
        type: string

  # Referenced by the 500 response.
  ProcessingError:
    type: object
    properties:
      error:
        type: string