@@ -618,9 +618,76 @@ This endpoint is public (no API key check). By default, it is read-only. To make
618
618
619
619
``` json
620
620
{
621
- "default_generation_settings" : { ... },
621
+ "default_generation_settings" : {
622
+ "id" : 0 ,
623
+ "id_task" : -1 ,
624
+ "n_ctx" : 1024 ,
625
+ "speculative" : false ,
626
+ "is_processing" : false ,
627
+ "params" : {
628
+ "n_predict" : -1 ,
629
+ "seed" : 4294967295 ,
630
+ "temperature" : 0.800000011920929 ,
631
+ "dynatemp_range" : 0.0 ,
632
+ "dynatemp_exponent" : 1.0 ,
633
+ "top_k" : 40 ,
634
+ "top_p" : 0.949999988079071 ,
635
+ "min_p" : 0.05000000074505806 ,
636
+ "xtc_probability" : 0.0 ,
637
+ "xtc_threshold" : 0.10000000149011612 ,
638
+ "typical_p" : 1.0 ,
639
+ "repeat_last_n" : 64 ,
640
+ "repeat_penalty" : 1.0 ,
641
+ "presence_penalty" : 0.0 ,
642
+ "frequency_penalty" : 0.0 ,
643
+ "dry_multiplier" : 0.0 ,
644
+ "dry_base" : 1.75 ,
645
+ "dry_allowed_length" : 2 ,
646
+ "dry_penalty_last_n" : -1 ,
647
+ "dry_sequence_breakers" : [
648
+ " \n " ,
649
+ " :" ,
650
+ " \" " ,
651
+ " *"
652
+ ],
653
+ "mirostat" : 0 ,
654
+ "mirostat_tau" : 5.0 ,
655
+ "mirostat_eta" : 0.10000000149011612 ,
656
+ "penalize_nl" : false ,
657
+ "stop" : [],
658
+ "max_tokens" : -1 ,
659
+ "n_keep" : 0 ,
660
+ "n_discard" : 0 ,
661
+ "ignore_eos" : false ,
662
+ "stream" : true ,
663
+ "n_probs" : 0 ,
664
+ "min_keep" : 0 ,
665
+ "grammar" : " " ,
666
+ "samplers" : [
667
+ " dry" ,
668
+ " top_k" ,
669
+ " typ_p" ,
670
+ " top_p" ,
671
+ " min_p" ,
672
+ " xtc" ,
673
+ " temperature"
674
+ ],
675
+ "speculative.n_max" : 16 ,
676
+ "speculative.n_min" : 5 ,
677
+ "speculative.p_min" : 0.8999999761581421 ,
678
+ "timings_per_token" : false
679
+ },
680
+ "prompt" : " " ,
681
+ "next_token" : {
682
+ "has_next_token" : true ,
683
+ "has_new_line" : false ,
684
+ "n_remain" : -1 ,
685
+ "n_decoded" : 0 ,
686
+ "stopping_word" : " "
687
+ }
688
+ },
622
689
"total_slots" : 1 ,
623
- "chat_template" : " "
690
+ "chat_template" : " ... "
624
691
}
625
692
```
626
693
@@ -739,56 +806,74 @@ Example:
739
806
740
807
``` json
741
808
[
742
- {
743
- "dynatemp_exponent" : 1.0 ,
744
- "dynatemp_range" : 0.0 ,
745
- "frequency_penalty" : 0.0 ,
746
- "grammar" : " " ,
747
- "id" : 0 ,
748
- "ignore_eos" : false ,
749
- "is_processing" : false ,
750
- "logit_bias" : [],
751
- "min_p" : 0.05000000074505806 ,
752
- "mirostat" : 0 ,
753
- "mirostat_eta" : 0.10000000149011612 ,
754
- "mirostat_tau" : 5.0 ,
755
- "model" : " llama-2-7b-32k-instruct.Q2_K.gguf" ,
756
- "n_ctx" : 2048 ,
757
- "n_keep" : 0 ,
758
- "n_predict" : 100000 ,
759
- "n_probs" : 0 ,
760
- "next_token" : {
761
- "has_next_token" : true ,
762
- "n_remain" : -1 ,
763
- "n_decoded" : 0 ,
764
- "stopped_eos" : false ,
765
- "stopped_limit" : false ,
766
- "stopped_word" : false ,
767
- "stopping_word" : " "
768
- },
769
- "penalize_nl" : true ,
770
- "presence_penalty" : 0.0 ,
771
- "prompt" : " Say hello to llama.cpp" ,
772
- "repeat_last_n" : 64 ,
773
- "repeat_penalty" : 1.100000023841858 ,
774
- "samplers" : [
775
- " top_k" ,
776
- " typical_p" ,
777
- " top_p" ,
778
- " min_p" ,
779
- " temperature"
780
- ],
781
- "seed" : 42 ,
782
- "stop" : [
783
- " \n "
784
- ],
785
- "stream" : false ,
786
- "task_id" : 0 ,
787
- "temperature" : 0.0 ,
788
- "top_k" : 40 ,
789
- "top_p" : 0.949999988079071 ,
790
- "typical_p" : 1.0
809
+ {
810
+ "id" : 0 ,
811
+ "id_task" : -1 ,
812
+ "n_ctx" : 1024 ,
813
+ "speculative" : false ,
814
+ "is_processing" : false ,
815
+ "params" : {
816
+ "n_predict" : -1 ,
817
+ "seed" : 4294967295 ,
818
+ "temperature" : 0.800000011920929 ,
819
+ "dynatemp_range" : 0.0 ,
820
+ "dynatemp_exponent" : 1.0 ,
821
+ "top_k" : 40 ,
822
+ "top_p" : 0.949999988079071 ,
823
+ "min_p" : 0.05000000074505806 ,
824
+ "xtc_probability" : 0.0 ,
825
+ "xtc_threshold" : 0.10000000149011612 ,
826
+ "typical_p" : 1.0 ,
827
+ "repeat_last_n" : 64 ,
828
+ "repeat_penalty" : 1.0 ,
829
+ "presence_penalty" : 0.0 ,
830
+ "frequency_penalty" : 0.0 ,
831
+ "dry_multiplier" : 0.0 ,
832
+ "dry_base" : 1.75 ,
833
+ "dry_allowed_length" : 2 ,
834
+ "dry_penalty_last_n" : -1 ,
835
+ "dry_sequence_breakers" : [
836
+ " \n " ,
837
+ " :" ,
838
+ " \" " ,
839
+ " *"
840
+ ],
841
+ "mirostat" : 0 ,
842
+ "mirostat_tau" : 5.0 ,
843
+ "mirostat_eta" : 0.10000000149011612 ,
844
+ "penalize_nl" : false ,
845
+ "stop" : [],
846
+ "max_tokens" : -1 ,
847
+ "n_keep" : 0 ,
848
+ "n_discard" : 0 ,
849
+ "ignore_eos" : false ,
850
+ "stream" : true ,
851
+ "n_probs" : 0 ,
852
+ "min_keep" : 0 ,
853
+ "grammar" : " " ,
854
+ "samplers" : [
855
+ " dry" ,
856
+ " top_k" ,
857
+ " typ_p" ,
858
+ " top_p" ,
859
+ " min_p" ,
860
+ " xtc" ,
861
+ " temperature"
862
+ ],
863
+ "speculative.n_max" : 16 ,
864
+ "speculative.n_min" : 5 ,
865
+ "speculative.p_min" : 0.8999999761581421 ,
866
+ "timings_per_token" : false
867
+ },
868
+ "prompt" : " " ,
869
+ "next_token" : {
870
+ "has_next_token" : true ,
871
+ "has_new_line" : false ,
872
+ "n_remain" : -1 ,
873
+ "n_decoded" : 0 ,
874
+ "stopping_word" : " "
791
875
}
876
+ }
792
877
]
793
878
```
794
879
0 commit comments