@mixedbread/sdk 0.28.1 → 0.29.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -376,7 +376,13 @@ export namespace VectorStoreFile {
376
376
  /**
377
377
  * metadata of the chunk
378
378
  */
379
- generated_metadata?: { [key: string]: unknown } | null;
379
+ generated_metadata?:
380
+ | TextInputChunk.MarkdownChunkGeneratedMetadata
381
+ | TextInputChunk.TextChunkGeneratedMetadata
382
+ | TextInputChunk.PdfChunkGeneratedMetadata
383
+ | TextInputChunk.CodeChunkGeneratedMetadata
384
+ | TextInputChunk.AudioChunkGeneratedMetadata
385
+ | null;
380
386
 
381
387
  /**
382
388
  * model used for this chunk
@@ -399,6 +405,98 @@ export namespace VectorStoreFile {
399
405
  text: string;
400
406
  }
401
407
 
408
+ export namespace TextInputChunk {
409
+ export interface MarkdownChunkGeneratedMetadata {
410
+ type?: 'markdown';
411
+
412
+ file_type?: 'text/markdown';
413
+
414
+ language: string;
415
+
416
+ word_count: number;
417
+
418
+ file_size: number;
419
+
420
+ chunk_headings?: Array<MarkdownChunkGeneratedMetadata.ChunkHeading>;
421
+
422
+ heading_context?: Array<MarkdownChunkGeneratedMetadata.HeadingContext>;
423
+
424
+ [k: string]: unknown;
425
+ }
426
+
427
+ export namespace MarkdownChunkGeneratedMetadata {
428
+ export interface ChunkHeading {
429
+ level: number;
430
+
431
+ text: string;
432
+ }
433
+
434
+ export interface HeadingContext {
435
+ level: number;
436
+
437
+ text: string;
438
+ }
439
+ }
440
+
441
+ export interface TextChunkGeneratedMetadata {
442
+ type?: 'text';
443
+
444
+ file_type?: 'text/plain';
445
+
446
+ language: string;
447
+
448
+ word_count: number;
449
+
450
+ file_size: number;
451
+
452
+ [k: string]: unknown;
453
+ }
454
+
455
+ export interface PdfChunkGeneratedMetadata {
456
+ type?: 'pdf';
457
+
458
+ file_type?: 'application/pdf';
459
+
460
+ total_pages: number;
461
+
462
+ total_size: number;
463
+
464
+ [k: string]: unknown;
465
+ }
466
+
467
+ export interface CodeChunkGeneratedMetadata {
468
+ type?: 'code';
469
+
470
+ file_type: string;
471
+
472
+ language: string;
473
+
474
+ word_count: number;
475
+
476
+ file_size: number;
477
+
478
+ [k: string]: unknown;
479
+ }
480
+
481
+ export interface AudioChunkGeneratedMetadata {
482
+ type?: 'audio';
483
+
484
+ file_type: string;
485
+
486
+ file_size: number;
487
+
488
+ total_duration_seconds: number;
489
+
490
+ sample_rate: number;
491
+
492
+ channels: number;
493
+
494
+ audio_format: number;
495
+
496
+ [k: string]: unknown;
497
+ }
498
+ }
499
+
402
500
  export interface ImageURLInputChunk {
403
501
  /**
404
502
  * position of the chunk in a file
@@ -413,7 +511,13 @@ export namespace VectorStoreFile {
413
511
  /**
414
512
  * metadata of the chunk
415
513
  */
416
- generated_metadata?: { [key: string]: unknown } | null;
514
+ generated_metadata?:
515
+ | ImageURLInputChunk.MarkdownChunkGeneratedMetadata
516
+ | ImageURLInputChunk.TextChunkGeneratedMetadata
517
+ | ImageURLInputChunk.PdfChunkGeneratedMetadata
518
+ | ImageURLInputChunk.CodeChunkGeneratedMetadata
519
+ | ImageURLInputChunk.AudioChunkGeneratedMetadata
520
+ | null;
417
521
 
418
522
  /**
419
523
  * model used for this chunk
@@ -442,6 +546,96 @@ export namespace VectorStoreFile {
442
546
  }
443
547
 
444
548
  export namespace ImageURLInputChunk {
549
+ export interface MarkdownChunkGeneratedMetadata {
550
+ type?: 'markdown';
551
+
552
+ file_type?: 'text/markdown';
553
+
554
+ language: string;
555
+
556
+ word_count: number;
557
+
558
+ file_size: number;
559
+
560
+ chunk_headings?: Array<MarkdownChunkGeneratedMetadata.ChunkHeading>;
561
+
562
+ heading_context?: Array<MarkdownChunkGeneratedMetadata.HeadingContext>;
563
+
564
+ [k: string]: unknown;
565
+ }
566
+
567
+ export namespace MarkdownChunkGeneratedMetadata {
568
+ export interface ChunkHeading {
569
+ level: number;
570
+
571
+ text: string;
572
+ }
573
+
574
+ export interface HeadingContext {
575
+ level: number;
576
+
577
+ text: string;
578
+ }
579
+ }
580
+
581
+ export interface TextChunkGeneratedMetadata {
582
+ type?: 'text';
583
+
584
+ file_type?: 'text/plain';
585
+
586
+ language: string;
587
+
588
+ word_count: number;
589
+
590
+ file_size: number;
591
+
592
+ [k: string]: unknown;
593
+ }
594
+
595
+ export interface PdfChunkGeneratedMetadata {
596
+ type?: 'pdf';
597
+
598
+ file_type?: 'application/pdf';
599
+
600
+ total_pages: number;
601
+
602
+ total_size: number;
603
+
604
+ [k: string]: unknown;
605
+ }
606
+
607
+ export interface CodeChunkGeneratedMetadata {
608
+ type?: 'code';
609
+
610
+ file_type: string;
611
+
612
+ language: string;
613
+
614
+ word_count: number;
615
+
616
+ file_size: number;
617
+
618
+ [k: string]: unknown;
619
+ }
620
+
621
+ export interface AudioChunkGeneratedMetadata {
622
+ type?: 'audio';
623
+
624
+ file_type: string;
625
+
626
+ file_size: number;
627
+
628
+ total_duration_seconds: number;
629
+
630
+ sample_rate: number;
631
+
632
+ channels: number;
633
+
634
+ audio_format: number;
635
+
636
+ [k: string]: unknown;
637
+ }
638
+
445
639
  /**
446
640
  * The image input specification.
447
641
  */
@@ -472,7 +666,13 @@ export namespace VectorStoreFile {
472
666
  /**
473
667
  * metadata of the chunk
474
668
  */
475
- generated_metadata?: { [key: string]: unknown } | null;
669
+ generated_metadata?:
670
+ | AudioURLInputChunk.MarkdownChunkGeneratedMetadata
671
+ | AudioURLInputChunk.TextChunkGeneratedMetadata
672
+ | AudioURLInputChunk.PdfChunkGeneratedMetadata
673
+ | AudioURLInputChunk.CodeChunkGeneratedMetadata
674
+ | AudioURLInputChunk.AudioChunkGeneratedMetadata
675
+ | null;
476
676
 
477
677
  /**
478
678
  * model used for this chunk
@@ -506,6 +706,96 @@ export namespace VectorStoreFile {
506
706
  }
507
707
 
508
708
  export namespace AudioURLInputChunk {
709
+ export interface MarkdownChunkGeneratedMetadata {
710
+ type?: 'markdown';
711
+
712
+ file_type?: 'text/markdown';
713
+
714
+ language: string;
715
+
716
+ word_count: number;
717
+
718
+ file_size: number;
719
+
720
+ chunk_headings?: Array<MarkdownChunkGeneratedMetadata.ChunkHeading>;
721
+
722
+ heading_context?: Array<MarkdownChunkGeneratedMetadata.HeadingContext>;
723
+
724
+ [k: string]: unknown;
725
+ }
726
+
727
+ export namespace MarkdownChunkGeneratedMetadata {
728
+ export interface ChunkHeading {
729
+ level: number;
730
+
731
+ text: string;
732
+ }
733
+
734
+ export interface HeadingContext {
735
+ level: number;
736
+
737
+ text: string;
738
+ }
739
+ }
740
+
741
+ export interface TextChunkGeneratedMetadata {
742
+ type?: 'text';
743
+
744
+ file_type?: 'text/plain';
745
+
746
+ language: string;
747
+
748
+ word_count: number;
749
+
750
+ file_size: number;
751
+
752
+ [k: string]: unknown;
753
+ }
754
+
755
+ export interface PdfChunkGeneratedMetadata {
756
+ type?: 'pdf';
757
+
758
+ file_type?: 'application/pdf';
759
+
760
+ total_pages: number;
761
+
762
+ total_size: number;
763
+
764
+ [k: string]: unknown;
765
+ }
766
+
767
+ export interface CodeChunkGeneratedMetadata {
768
+ type?: 'code';
769
+
770
+ file_type: string;
771
+
772
+ language: string;
773
+
774
+ word_count: number;
775
+
776
+ file_size: number;
777
+
778
+ [k: string]: unknown;
779
+ }
780
+
781
+ export interface AudioChunkGeneratedMetadata {
782
+ type?: 'audio';
783
+
784
+ file_type: string;
785
+
786
+ file_size: number;
787
+
788
+ total_duration_seconds: number;
789
+
790
+ sample_rate: number;
791
+
792
+ channels: number;
793
+
794
+ audio_format: number;
795
+
796
+ [k: string]: unknown;
797
+ }
798
+
509
799
  /**
510
800
  * The audio input specification.
511
801
  */
@@ -531,7 +821,13 @@ export namespace VectorStoreFile {
531
821
  /**
532
822
  * metadata of the chunk
533
823
  */
534
- generated_metadata?: { [key: string]: unknown } | null;
824
+ generated_metadata?:
825
+ | VideoURLInputChunk.MarkdownChunkGeneratedMetadata
826
+ | VideoURLInputChunk.TextChunkGeneratedMetadata
827
+ | VideoURLInputChunk.PdfChunkGeneratedMetadata
828
+ | VideoURLInputChunk.CodeChunkGeneratedMetadata
829
+ | VideoURLInputChunk.AudioChunkGeneratedMetadata
830
+ | null;
535
831
 
536
832
  /**
537
833
  * model used for this chunk
@@ -560,6 +856,96 @@ export namespace VectorStoreFile {
560
856
  }
561
857
 
562
858
  export namespace VideoURLInputChunk {
859
+ export interface MarkdownChunkGeneratedMetadata {
860
+ type?: 'markdown';
861
+
862
+ file_type?: 'text/markdown';
863
+
864
+ language: string;
865
+
866
+ word_count: number;
867
+
868
+ file_size: number;
869
+
870
+ chunk_headings?: Array<MarkdownChunkGeneratedMetadata.ChunkHeading>;
871
+
872
+ heading_context?: Array<MarkdownChunkGeneratedMetadata.HeadingContext>;
873
+
874
+ [k: string]: unknown;
875
+ }
876
+
877
+ export namespace MarkdownChunkGeneratedMetadata {
878
+ export interface ChunkHeading {
879
+ level: number;
880
+
881
+ text: string;
882
+ }
883
+
884
+ export interface HeadingContext {
885
+ level: number;
886
+
887
+ text: string;
888
+ }
889
+ }
890
+
891
+ export interface TextChunkGeneratedMetadata {
892
+ type?: 'text';
893
+
894
+ file_type?: 'text/plain';
895
+
896
+ language: string;
897
+
898
+ word_count: number;
899
+
900
+ file_size: number;
901
+
902
+ [k: string]: unknown;
903
+ }
904
+
905
+ export interface PdfChunkGeneratedMetadata {
906
+ type?: 'pdf';
907
+
908
+ file_type?: 'application/pdf';
909
+
910
+ total_pages: number;
911
+
912
+ total_size: number;
913
+
914
+ [k: string]: unknown;
915
+ }
916
+
917
+ export interface CodeChunkGeneratedMetadata {
918
+ type?: 'code';
919
+
920
+ file_type: string;
921
+
922
+ language: string;
923
+
924
+ word_count: number;
925
+
926
+ file_size: number;
927
+
928
+ [k: string]: unknown;
929
+ }
930
+
931
+ export interface AudioChunkGeneratedMetadata {
932
+ type?: 'audio';
933
+
934
+ file_type: string;
935
+
936
+ file_size: number;
937
+
938
+ total_duration_seconds: number;
939
+
940
+ sample_rate: number;
941
+
942
+ channels: number;
943
+
944
+ audio_format: number;
945
+
946
+ [k: string]: unknown;
947
+ }
948
+
563
949
  /**
564
950
  * The video input specification.
565
951
  */