|
11 | 11 | "name": "Apache 2.0", |
12 | 12 | "url": "https://www.apache.org/licenses/LICENSE-2.0" |
13 | 13 | }, |
14 | | - "version": "0.2.1" |
| 14 | + "version": "0.3.0" |
15 | 15 | }, |
16 | 16 | "paths": { |
17 | 17 | "/generate": { |
|
38 | 38 | "content": { |
39 | 39 | "application/json": { |
40 | 40 | "schema": { |
41 | | - "type": "array", |
42 | | - "items": { |
43 | | - "$ref": "#/components/schemas/GenerateResponse" |
44 | | - } |
| 41 | + "$ref": "#/components/schemas/GenerateResponse" |
45 | 42 | } |
46 | 43 | } |
47 | 44 | } |
|
51 | 48 | "content": { |
52 | 49 | "application/json": { |
53 | 50 | "schema": { |
54 | | - "type": "array", |
55 | | - "items": { |
56 | | - "$ref": "#/components/schemas/ErrorResponse" |
57 | | - } |
| 51 | + "$ref": "#/components/schemas/ErrorResponse" |
58 | 52 | }, |
59 | 53 | "example": { |
60 | 54 | "error": "Input validation error" |
|
67 | 61 | "content": { |
68 | 62 | "application/json": { |
69 | 63 | "schema": { |
70 | | - "type": "array", |
71 | | - "items": { |
72 | | - "$ref": "#/components/schemas/ErrorResponse" |
73 | | - } |
| 64 | + "$ref": "#/components/schemas/ErrorResponse" |
74 | 65 | }, |
75 | 66 | "example": { |
76 | 67 | "error": "Request failed during generation" |
|
83 | 74 | "content": { |
84 | 75 | "application/json": { |
85 | 76 | "schema": { |
86 | | - "type": "array", |
87 | | - "items": { |
88 | | - "$ref": "#/components/schemas/ErrorResponse" |
89 | | - } |
| 77 | + "$ref": "#/components/schemas/ErrorResponse" |
90 | 78 | }, |
91 | 79 | "example": { |
92 | 80 | "error": "Model is overloaded" |
|
99 | 87 | "content": { |
100 | 88 | "application/json": { |
101 | 89 | "schema": { |
102 | | - "type": "array", |
103 | | - "items": { |
104 | | - "$ref": "#/components/schemas/ErrorResponse" |
105 | | - } |
| 90 | + "$ref": "#/components/schemas/ErrorResponse" |
106 | 91 | }, |
107 | 92 | "example": { |
108 | 93 | "error": "Incomplete generation" |
|
136 | 121 | "200": { |
137 | 122 | "description": "Generated Text", |
138 | 123 | "content": { |
139 | | - "text/event-stream ": { |
| 124 | + "text/event-stream": { |
140 | 125 | "schema": { |
141 | | - "type": "array", |
142 | | - "items": { |
143 | | - "$ref": "#/components/schemas/StreamResponse" |
144 | | - } |
| 126 | + "$ref": "#/components/schemas/StreamResponse" |
145 | 127 | } |
146 | 128 | } |
147 | 129 | } |
148 | 130 | }, |
149 | 131 | "422": { |
150 | 132 | "description": "Input validation error", |
151 | 133 | "content": { |
152 | | - "text/event-stream ": { |
| 134 | + "text/event-stream": { |
153 | 135 | "schema": { |
154 | | - "type": "array", |
155 | | - "items": { |
156 | | - "$ref": "#/components/schemas/ErrorResponse" |
157 | | - } |
| 136 | + "$ref": "#/components/schemas/ErrorResponse" |
158 | 137 | }, |
159 | 138 | "example": { |
160 | 139 | "error": "Input validation error" |
|
165 | 144 | "424": { |
166 | 145 | "description": "Generation Error", |
167 | 146 | "content": { |
168 | | - "text/event-stream ": { |
| 147 | + "text/event-stream": { |
169 | 148 | "schema": { |
170 | | - "type": "array", |
171 | | - "items": { |
172 | | - "$ref": "#/components/schemas/ErrorResponse" |
173 | | - } |
| 149 | + "$ref": "#/components/schemas/ErrorResponse" |
174 | 150 | }, |
175 | 151 | "example": { |
176 | 152 | "error": "Request failed during generation" |
|
181 | 157 | "429": { |
182 | 158 | "description": "Model is overloaded", |
183 | 159 | "content": { |
184 | | - "text/event-stream ": { |
| 160 | + "text/event-stream": { |
185 | 161 | "schema": { |
186 | | - "type": "array", |
187 | | - "items": { |
188 | | - "$ref": "#/components/schemas/ErrorResponse" |
189 | | - } |
| 162 | + "$ref": "#/components/schemas/ErrorResponse" |
190 | 163 | }, |
191 | 164 | "example": { |
192 | 165 | "error": "Model is overloaded" |
|
197 | 170 | "500": { |
198 | 171 | "description": "Incomplete generation", |
199 | 172 | "content": { |
200 | | - "text/event-stream ": { |
| 173 | + "text/event-stream": { |
201 | 174 | "schema": { |
202 | | - "type": "array", |
203 | | - "items": { |
204 | | - "$ref": "#/components/schemas/ErrorResponse" |
205 | | - } |
| 175 | + "$ref": "#/components/schemas/ErrorResponse" |
206 | 176 | }, |
207 | 177 | "example": { |
208 | 178 | "error": "Incomplete generation" |
|
213 | 183 | }, |
214 | 184 | "deprecated": false |
215 | 185 | } |
| 186 | + }, |
| 187 | + "/metrics": { |
| 188 | + "get": { |
| 189 | + "tags": [ |
| 190 | + "Text Generation Inference" |
| 191 | + ], |
| 192 | + "summary": "Prometheus metrics scrape endpoint", |
| 193 | + "description": "Prometheus metrics scrape endpoint", |
| 194 | + "operationId": "metrics", |
| 195 | + "responses": { |
| 196 | + "200": { |
| 197 | + "description": "Prometheus Metrics", |
| 198 | + "content": { |
| 199 | + "text/plain": { |
| 200 | + "schema": { |
| 201 | + "type": "string" |
| 202 | + } |
| 203 | + } |
| 204 | + } |
| 205 | + } |
| 206 | + }, |
| 207 | + "deprecated": false |
| 208 | + } |
216 | 209 | } |
217 | 210 | }, |
218 | 211 | "components": { |
|
0 commit comments