|
237 | 237 | " ]\n", |
238 | 238 | " },\n", |
239 | 239 | " {\n", |
240 | | - " \"@odata.type\": \"#Microsoft.Skills.Text.LanguageDetectionSkill\",\n", |
241 | | - " \"context\": \"/document\",\n", |
242 | | - " \"description\": \"If you have multilingual content, adding a language code is useful for filtering\",\n", |
243 | | - " \"inputs\": [\n", |
244 | | - " {\n", |
245 | | - " \"name\": \"text\",\n", |
246 | | - " \"source\": \"/document/content\"\n", |
247 | | - " }\n", |
248 | | - " ],\n", |
249 | | - " \"outputs\": [\n", |
250 | | - " {\n", |
251 | | - " \"name\": \"languageCode\",\n", |
252 | | - " \"targetName\": \"language\"\n", |
253 | | - " }\n", |
254 | | - " ]\n", |
255 | | - " },\n", |
256 | | - " {\n", |
257 | 240 | " \"@odata.type\": \"#Microsoft.Skills.Text.SplitSkill\",\n", |
258 | 241 | " \"context\": \"/document\",\n", |
259 | 242 | " \"textSplitMode\": \"pages\",\n", |
|
263 | 246 | " {\n", |
264 | 247 | " \"name\": \"text\",\n", |
265 | 248 | " \"source\": \"/document/merged_text\"\n", |
266 | | - " },\n", |
267 | | - " {\n", |
268 | | - " \"name\": \"languageCode\",\n", |
269 | | - " \"source\": \"/document/language\"\n", |
270 | 249 | " }\n", |
271 | 250 | " ],\n", |
272 | 251 | " \"outputs\": [\n", |
|
285 | 264 | " {\n", |
286 | 265 | " \"name\": \"text\", \n", |
287 | 266 | " \"source\": \"/document/pages/*\"\n", |
288 | | - " },\n", |
289 | | - " {\n", |
290 | | - " \"name\": \"languageCode\",\n", |
291 | | - " \"source\": \"/document/language\"\n", |
292 | 267 | " }\n", |
293 | 268 | " ],\n", |
294 | 269 | " \"outputs\": [\n", |
|
308 | 283 | " {\n", |
309 | 284 | " \"name\": \"text\", \n", |
310 | 285 | " \"source\":\"/document/pages/*\"\n", |
311 | | - " },\n", |
312 | | - " {\n", |
313 | | - " \"name\": \"languageCode\",\n", |
314 | | - " \"source\": \"/document/language\"\n", |
315 | 286 | " }\n", |
316 | 287 | " ],\n", |
317 | 288 | " \"outputs\": [\n", |
|
387 | 358 | " {\"name\": \"title\", \"type\": \"Edm.String\", \"searchable\": \"true\", \"retrievable\": \"true\", \"facetable\": \"false\", \"filterable\": \"true\", \"sortable\": \"false\"},\n", |
388 | 359 | " {\"name\": \"content\", \"type\": \"Edm.String\", \"searchable\": \"true\", \"retrievable\": \"true\", \"sortable\": \"false\", \"filterable\": \"false\",\"facetable\": \"false\"},\n", |
389 | 360 | " {\"name\": \"chunks\",\"type\": \"Collection(Edm.String)\", \"searchable\": \"false\", \"retrievable\": \"true\", \"sortable\": \"false\", \"filterable\": \"false\", \"facetable\": \"false\"},\n", |
390 | | - " {\"name\": \"language\", \"type\": \"Edm.String\", \"searchable\": \"false\", \"retrievable\": \"true\", \"sortable\": \"true\", \"filterable\": \"true\", \"facetable\": \"true\"},\n", |
391 | 361 | " {\"name\": \"name\", \"type\": \"Edm.String\", \"searchable\": \"true\", \"retrievable\": \"true\", \"sortable\": \"false\", \"filterable\": \"false\", \"facetable\": \"false\"},\n", |
392 | 362 | " {\"name\": \"location\", \"type\": \"Edm.String\", \"searchable\": \"false\", \"retrievable\": \"true\", \"sortable\": \"false\", \"filterable\": \"false\", \"facetable\": \"false\"},\n", |
393 | 363 | " {\"name\": \"vectorized\", \"type\": \"Edm.Boolean\", \"searchable\": \"false\", \"retrievable\": \"true\", \"sortable\": \"false\", \"filterable\": \"false\", \"facetable\": \"false\"},\n", |
|
525 | 495 | " \"targetFieldName\" : \"images_text\"\n", |
526 | 496 | " },\n", |
527 | 497 | " {\n", |
528 | | - " \"sourceFieldName\": \"/document/language\",\n", |
529 | | - " \"targetFieldName\": \"language\"\n", |
530 | | - " },\n", |
531 | | - " {\n", |
532 | 498 | " \"sourceFieldName\": \"/document/pages/*/keyPhrases/*\",\n", |
533 | 499 | " \"targetFieldName\": \"keyPhrases\"\n", |
534 | 500 | " },\n", |
|
582 | 548 | }, |
583 | 549 | { |
584 | 550 | "cell_type": "code", |
585 | | - "execution_count": null, |
| 551 | + "execution_count": 20, |
586 | 552 | "metadata": { |
587 | 553 | "tags": [] |
588 | 554 | }, |
589 | | - "outputs": [], |
| 555 | + "outputs": [ |
| 556 | + { |
| 557 | + "name": "stdout", |
| 558 | + "output_type": "stream", |
| 559 | + "text": [ |
| 560 | + "200\n", |
| 561 | + "Status: inProgress\n", |
| 562 | + "Items Processed: 3250\n", |
| 563 | + "True\n" |
| 564 | + ] |
| 565 | + } |
| 566 | + ], |
590 | 567 | "source": [ |
591 | 568 | "# Optionally, get indexer status to confirm that it's running\n", |
592 | 569 | "r = requests.get(os.environ['AZURE_SEARCH_ENDPOINT'] + \"/indexers/\" + indexer_name +\n", |
|
632 | 609 | }, |
633 | 610 | { |
634 | 611 | "cell_type": "code", |
635 | | - "execution_count": 28, |
| 612 | + "execution_count": 14, |
636 | 613 | "metadata": {}, |
637 | 614 | "outputs": [ |
638 | 615 | { |
639 | 616 | "name": "stdout", |
640 | 617 | "output_type": "stream", |
641 | 618 | "text": [ |
642 | | - "201\n", |
| 619 | + "204\n", |
643 | 620 | "True\n" |
644 | 621 | ] |
645 | 622 | } |
|
0 commit comments