mirror of
https://github.com/bentoml/OpenLLM.git
synced 2026-01-21 22:10:45 -05:00
Commit Graph
Select branches
Hide Pull Requests
dependabot/github_actions/actions-dependencies-67da17a5df
dependabot/pip/production-dependencies-041ea65659
main
pre-commit-ci-update-config
#1
#10
#1000
#1001
#1002
#1004
#1005
#1006
#1007
#1008
#1011
#1012
#1013
#1016
#1017
#1018
#1019
#102
#1022
#1023
#1024
#1027
#1029
#103
#1030
#1031
#1032
#1033
#1034
#1035
#1036
#1038
#1040
#1041
#1043
#1045
#1046
#1047
#1048
#105
#1051
#1052
#1054
#1056
#1057
#1058
#1059
#106
#1060
#1061
#1065
#1066
#1067
#1069
#107
#1070
#1071
#1072
#1073
#1074
#1075
#1077
#1079
#1080
#1081
#1082
#1084
#1085
#1086
#1087
#1088
#1089
#1090
#1091
#1092
#1093
#1094
#1095
#1096
#1097
#1098
#1099
#110
#1100
#1102
#1103
#1104
#1105
#1106
#1107
#1108
#1109
#1110
#1111
#1113
#1114
#1116
#1117
#1118
#1119
#1120
#1121
#1122
#1123
#1124
#1125
#1126
#1127
#1128
#113
#1130
#1131
#1132
#1133
#1134
#1135
#1138
#1139
#114
#1140
#1141
#1142
#1143
#1144
#1145
#1146
#1147
#1148
#1149
#115
#1150
#1151
#1152
#1153
#1154
#1155
#1156
#1157
#1158
#1159
#116
#1160
#1161
#1162
#1163
#1164
#1165
#1166
#1167
#1169
#117
#1170
#1171
#1173
#1174
#1175
#1176
#1177
#1179
#118
#1180
#1181
#1182
#1183
#1187
#1188
#1189
#119
#1190
#1191
#1192
#1193
#1194
#1195
#1196
#1197
#1198
#1199
#12
#1200
#1202
#1203
#1204
#1205
#1206
#1207
#1208
#1209
#1210
#1210
#1211
#1211
#1212
#1213
#1214
#1215
#1216
#1216
#122
#126
#128
#129
#130
#131
#132
#133
#134
#137
#138
#139
#141
#142
#143
#144
#145
#146
#148
#150
#151
#152
#153
#154
#155
#160
#161
#162
#163
#164
#165
#166
#167
#168
#169
#17
#170
#171
#173
#174
#176
#177
#178
#179
#18
#181
#182
#183
#184
#185
#186
#187
#188
#189
#19
#190
#191
#193
#197
#199
#2
#200
#201
#203
#207
#208
#211
#212
#213
#215
#216
#217
#218
#219
#22
#220
#221
#222
#223
#224
#227
#228
#23
#230
#232
#240
#242
#243
#244
#245
#246
#249
#25
#250
#251
#252
#255
#256
#257
#26
#260
#261
#262
#263
#264
#265
#266
#267
#268
#269
#27
#270
#271
#273
#278
#279
#28
#280
#283
#284
#285
#287
#288
#289
#29
#290
#291
#292
#293
#294
#295
#296
#297
#298
#302
#304
#305
#31
#314
#315
#316
#317
#318
#319
#320
#321
#322
#323
#324
#325
#326
#327
#328
#329
#330
#331
#332
#333
#334
#335
#336
#337
#338
#339
#340
#341
#342
#343
#344
#345
#346
#349
#35
#351
#352
#353
#355
#356
#357
#358
#359
#360
#361
#362
#363
#364
#365
#366
#367
#368
#369
#37
#370
#371
#372
#373
#374
#375
#376
#378
#379
#380
#381
#382
#383
#384
#389
#39
#390
#391
#392
#393
#394
#395
#396
#397
#398
#399
#4
#400
#401
#402
#403
#404
#405
#406
#407
#411
#412
#413
#414
#417
#423
#424
#425
#426
#427
#428
#429
#430
#431
#432
#433
#434
#435
#436
#437
#438
#439
#440
#441
#45
#455
#456
#457
#458
#459
#460
#461
#462
#463
#464
#465
#466
#467
#468
#469
#470
#471
#472
#473
#474
#475
#477
#478
#479
#480
#482
#483
#484
#485
#486
#487
#488
#489
#490
#491
#492
#493
#494
#495
#496
#497
#499
#5
#50
#500
#501
#502
#503
#504
#506
#508
#509
#51
#510
#511
#516
#518
#519
#52
#521
#522
#523
#524
#525
#526
#527
#528
#529
#530
#532
#533
#535
#536
#537
#538
#539
#54
#540
#541
#542
#544
#545
#546
#548
#549
#550
#554
#556
#557
#558
#559
#56
#560
#561
#562
#563
#564
#565
#566
#567
#568
#569
#57
#570
#571
#573
#574
#575
#576
#577
#578
#579
#58
#580
#581
#582
#583
#584
#585
#586
#587
#588
#589
#590
#591
#592
#593
#594
#595
#597
#599
#6
#60
#600
#601
#602
#605
#606
#609
#610
#611
#612
#613
#614
#615
#616
#617
#618
#619
#620
#621
#622
#623
#624
#625
#626
#627
#628
#629
#630
#631
#632
#633
#634
#635
#636
#637
#638
#639
#64
#640
#642
#643
#644
#645
#646
#647
#648
#651
#652
#653
#654
#655
#657
#658
#659
#66
#660
#661
#662
#663
#664
#665
#667
#668
#669
#671
#672
#673
#674
#675
#676
#677
#678
#679
#68
#680
#681
#682
#683
#684
#686
#687
#689
#690
#691
#692
#693
#694
#695
#698
#699
#7
#70
#700
#701
#702
#703
#704
#705
#706
#707
#708
#709
#71
#711
#712
#713
#714
#715
#716
#717
#718
#719
#72
#720
#721
#722
#723
#724
#725
#726
#727
#728
#729
#730
#733
#734
#735
#739
#74
#742
#749
#75
#750
#751
#753
#757
#76
#760
#761
#762
#763
#764
#765
#766
#767
#770
#772
#773
#774
#775
#776
#779
#781
#782
#783
#786
#789
#790
#791
#792
#793
#794
#796
#797
#798
#799
#8
#80
#805
#807
#808
#811
#812
#813
#814
#815
#816
#817
#818
#819
#821
#823
#824
#825
#826
#830
#831
#832
#833
#834
#836
#837
#838
#84
#841
#842
#843
#844
#845
#846
#847
#848
#85
#854
#855
#856
#857
#858
#866
#867
#868
#869
#87
#870
#877
#878
#879
#88
#880
#881
#883
#884
#885
#886
#887
#888
#889
#89
#890
#891
#892
#893
#896
#897
#898
#899
#9
#90
#906
#907
#908
#909
#91
#912
#913
#915
#916
#917
#918
#919
#92
#920
#923
#925
#928
#93
#931
#932
#933
#935
#938
#939
#940
#941
#942
#943
#945
#946
#947
#949
#95
#950
#953
#954
#955
#956
#957
#958
#959
#963
#964
#969
#970
#973
#974
#975
#976
#977
#978
#979
#98
#980
#981
#982
#983
#984
#985
#986
#987
#988
#989
#990
#991
#992
#993
#994
#995
#996
#997
#998
#999
v0.0.10
v0.0.11
v0.0.12
v0.0.13
v0.0.14
v0.0.15
v0.0.16
v0.0.17
v0.0.18
v0.0.19
v0.0.21
v0.0.22
v0.0.23
v0.0.24
v0.0.25
v0.0.26
v0.0.27
v0.0.28
v0.0.29
v0.0.30
v0.0.31
v0.0.32
v0.0.33
v0.0.34
v0.0.4
v0.0.5
v0.0.6
v0.0.7
v0.0.8
v0.0.9
v0.1.0
v0.1.1
v0.1.10
v0.1.11
v0.1.12
v0.1.13
v0.1.14
v0.1.15
v0.1.16
v0.1.17
v0.1.18
v0.1.19
v0.1.2
v0.1.20
v0.1.3
v0.1.4
v0.1.5
v0.1.6
v0.1.7
v0.1.8
v0.1.9
v0.2.0
v0.2.1
v0.2.10
v0.2.11
v0.2.12
v0.2.13
v0.2.14
v0.2.15
v0.2.16
v0.2.17
v0.2.18
v0.2.19
v0.2.2
v0.2.20
v0.2.21
v0.2.22
v0.2.23
v0.2.24
v0.2.25
v0.2.26
v0.2.27
v0.2.3
v0.2.4
v0.2.5
v0.2.6
v0.2.7
v0.2.8
v0.2.9
v0.3.0
v0.3.1
v0.3.10
v0.3.11
v0.3.12
v0.3.13
v0.3.14
v0.3.2
v0.3.3
v0.3.4
v0.3.5
v0.3.6
v0.3.7
v0.3.8
v0.3.9
v0.4.0
v0.4.1
v0.4.10
v0.4.11
v0.4.12
v0.4.13
v0.4.14
v0.4.15
v0.4.16
v0.4.17
v0.4.18
v0.4.19
v0.4.2
v0.4.20
v0.4.21
v0.4.22
v0.4.23
v0.4.24
v0.4.25
v0.4.26
v0.4.27
v0.4.28
v0.4.29
v0.4.3
v0.4.30
v0.4.31
v0.4.32
v0.4.33
v0.4.34
v0.4.35
v0.4.36
v0.4.37
v0.4.38
v0.4.39
v0.4.4
v0.4.40
v0.4.41
v0.4.42
v0.4.43
v0.4.44
v0.4.5
v0.4.6
v0.4.7
v0.4.8
v0.4.9
v0.5.0
v0.5.0-alpha
v0.5.0-alpha.1
v0.5.0-alpha.10
v0.5.0-alpha.11
v0.5.0-alpha.12
v0.5.0-alpha.13
v0.5.0-alpha.14
v0.5.0-alpha.15
v0.5.0-alpha.2
v0.5.0-alpha.3
v0.5.0-alpha.4
v0.5.0-alpha.5
v0.5.0-alpha.6
v0.5.0-alpha.7
v0.5.0-alpha.8
v0.5.0-alpha.9
v0.5.1
v0.5.2
v0.5.3
v0.5.4
v0.5.5
v0.5.6
v0.5.7
v0.6.0
v0.6.1
v0.6.10
v0.6.11
v0.6.12
v0.6.13
v0.6.14
v0.6.15
v0.6.16
v0.6.17
v0.6.18
v0.6.19
v0.6.2
v0.6.20
v0.6.21
v0.6.22
v0.6.23
v0.6.24
v0.6.25
v0.6.26
v0.6.27
v0.6.28
v0.6.29
v0.6.3
v0.6.30
v0.6.4
v0.6.5
v0.6.6
v0.6.7
v0.6.8
v0.6.9
Select branches
Hide Pull Requests
dependabot/github_actions/actions-dependencies-67da17a5df
dependabot/pip/production-dependencies-041ea65659
main
pre-commit-ci-update-config
#1
#10
#1000
#1001
#1002
#1004
#1005
#1006
#1007
#1008
#1011
#1012
#1013
#1016
#1017
#1018
#1019
#102
#1022
#1023
#1024
#1027
#1029
#103
#1030
#1031
#1032
#1033
#1034
#1035
#1036
#1038
#1040
#1041
#1043
#1045
#1046
#1047
#1048
#105
#1051
#1052
#1054
#1056
#1057
#1058
#1059
#106
#1060
#1061
#1065
#1066
#1067
#1069
#107
#1070
#1071
#1072
#1073
#1074
#1075
#1077
#1079
#1080
#1081
#1082
#1084
#1085
#1086
#1087
#1088
#1089
#1090
#1091
#1092
#1093
#1094
#1095
#1096
#1097
#1098
#1099
#110
#1100
#1102
#1103
#1104
#1105
#1106
#1107
#1108
#1109
#1110
#1111
#1113
#1114
#1116
#1117
#1118
#1119
#1120
#1121
#1122
#1123
#1124
#1125
#1126
#1127
#1128
#113
#1130
#1131
#1132
#1133
#1134
#1135
#1138
#1139
#114
#1140
#1141
#1142
#1143
#1144
#1145
#1146
#1147
#1148
#1149
#115
#1150
#1151
#1152
#1153
#1154
#1155
#1156
#1157
#1158
#1159
#116
#1160
#1161
#1162
#1163
#1164
#1165
#1166
#1167
#1169
#117
#1170
#1171
#1173
#1174
#1175
#1176
#1177
#1179
#118
#1180
#1181
#1182
#1183
#1187
#1188
#1189
#119
#1190
#1191
#1192
#1193
#1194
#1195
#1196
#1197
#1198
#1199
#12
#1200
#1202
#1203
#1204
#1205
#1206
#1207
#1208
#1209
#1210
#1210
#1211
#1211
#1212
#1213
#1214
#1215
#1216
#1216
#122
#126
#128
#129
#130
#131
#132
#133
#134
#137
#138
#139
#141
#142
#143
#144
#145
#146
#148
#150
#151
#152
#153
#154
#155
#160
#161
#162
#163
#164
#165
#166
#167
#168
#169
#17
#170
#171
#173
#174
#176
#177
#178
#179
#18
#181
#182
#183
#184
#185
#186
#187
#188
#189
#19
#190
#191
#193
#197
#199
#2
#200
#201
#203
#207
#208
#211
#212
#213
#215
#216
#217
#218
#219
#22
#220
#221
#222
#223
#224
#227
#228
#23
#230
#232
#240
#242
#243
#244
#245
#246
#249
#25
#250
#251
#252
#255
#256
#257
#26
#260
#261
#262
#263
#264
#265
#266
#267
#268
#269
#27
#270
#271
#273
#278
#279
#28
#280
#283
#284
#285
#287
#288
#289
#29
#290
#291
#292
#293
#294
#295
#296
#297
#298
#302
#304
#305
#31
#314
#315
#316
#317
#318
#319
#320
#321
#322
#323
#324
#325
#326
#327
#328
#329
#330
#331
#332
#333
#334
#335
#336
#337
#338
#339
#340
#341
#342
#343
#344
#345
#346
#349
#35
#351
#352
#353
#355
#356
#357
#358
#359
#360
#361
#362
#363
#364
#365
#366
#367
#368
#369
#37
#370
#371
#372
#373
#374
#375
#376
#378
#379
#380
#381
#382
#383
#384
#389
#39
#390
#391
#392
#393
#394
#395
#396
#397
#398
#399
#4
#400
#401
#402
#403
#404
#405
#406
#407
#411
#412
#413
#414
#417
#423
#424
#425
#426
#427
#428
#429
#430
#431
#432
#433
#434
#435
#436
#437
#438
#439
#440
#441
#45
#455
#456
#457
#458
#459
#460
#461
#462
#463
#464
#465
#466
#467
#468
#469
#470
#471
#472
#473
#474
#475
#477
#478
#479
#480
#482
#483
#484
#485
#486
#487
#488
#489
#490
#491
#492
#493
#494
#495
#496
#497
#499
#5
#50
#500
#501
#502
#503
#504
#506
#508
#509
#51
#510
#511
#516
#518
#519
#52
#521
#522
#523
#524
#525
#526
#527
#528
#529
#530
#532
#533
#535
#536
#537
#538
#539
#54
#540
#541
#542
#544
#545
#546
#548
#549
#550
#554
#556
#557
#558
#559
#56
#560
#561
#562
#563
#564
#565
#566
#567
#568
#569
#57
#570
#571
#573
#574
#575
#576
#577
#578
#579
#58
#580
#581
#582
#583
#584
#585
#586
#587
#588
#589
#590
#591
#592
#593
#594
#595
#597
#599
#6
#60
#600
#601
#602
#605
#606
#609
#610
#611
#612
#613
#614
#615
#616
#617
#618
#619
#620
#621
#622
#623
#624
#625
#626
#627
#628
#629
#630
#631
#632
#633
#634
#635
#636
#637
#638
#639
#64
#640
#642
#643
#644
#645
#646
#647
#648
#651
#652
#653
#654
#655
#657
#658
#659
#66
#660
#661
#662
#663
#664
#665
#667
#668
#669
#671
#672
#673
#674
#675
#676
#677
#678
#679
#68
#680
#681
#682
#683
#684
#686
#687
#689
#690
#691
#692
#693
#694
#695
#698
#699
#7
#70
#700
#701
#702
#703
#704
#705
#706
#707
#708
#709
#71
#711
#712
#713
#714
#715
#716
#717
#718
#719
#72
#720
#721
#722
#723
#724
#725
#726
#727
#728
#729
#730
#733
#734
#735
#739
#74
#742
#749
#75
#750
#751
#753
#757
#76
#760
#761
#762
#763
#764
#765
#766
#767
#770
#772
#773
#774
#775
#776
#779
#781
#782
#783
#786
#789
#790
#791
#792
#793
#794
#796
#797
#798
#799
#8
#80
#805
#807
#808
#811
#812
#813
#814
#815
#816
#817
#818
#819
#821
#823
#824
#825
#826
#830
#831
#832
#833
#834
#836
#837
#838
#84
#841
#842
#843
#844
#845
#846
#847
#848
#85
#854
#855
#856
#857
#858
#866
#867
#868
#869
#87
#870
#877
#878
#879
#88
#880
#881
#883
#884
#885
#886
#887
#888
#889
#89
#890
#891
#892
#893
#896
#897
#898
#899
#9
#90
#906
#907
#908
#909
#91
#912
#913
#915
#916
#917
#918
#919
#92
#920
#923
#925
#928
#93
#931
#932
#933
#935
#938
#939
#940
#941
#942
#943
#945
#946
#947
#949
#95
#950
#953
#954
#955
#956
#957
#958
#959
#963
#964
#969
#970
#973
#974
#975
#976
#977
#978
#979
#98
#980
#981
#982
#983
#984
#985
#986
#987
#988
#989
#990
#991
#992
#993
#994
#995
#996
#997
#998
#999
v0.0.10
v0.0.11
v0.0.12
v0.0.13
v0.0.14
v0.0.15
v0.0.16
v0.0.17
v0.0.18
v0.0.19
v0.0.21
v0.0.22
v0.0.23
v0.0.24
v0.0.25
v0.0.26
v0.0.27
v0.0.28
v0.0.29
v0.0.30
v0.0.31
v0.0.32
v0.0.33
v0.0.34
v0.0.4
v0.0.5
v0.0.6
v0.0.7
v0.0.8
v0.0.9
v0.1.0
v0.1.1
v0.1.10
v0.1.11
v0.1.12
v0.1.13
v0.1.14
v0.1.15
v0.1.16
v0.1.17
v0.1.18
v0.1.19
v0.1.2
v0.1.20
v0.1.3
v0.1.4
v0.1.5
v0.1.6
v0.1.7
v0.1.8
v0.1.9
v0.2.0
v0.2.1
v0.2.10
v0.2.11
v0.2.12
v0.2.13
v0.2.14
v0.2.15
v0.2.16
v0.2.17
v0.2.18
v0.2.19
v0.2.2
v0.2.20
v0.2.21
v0.2.22
v0.2.23
v0.2.24
v0.2.25
v0.2.26
v0.2.27
v0.2.3
v0.2.4
v0.2.5
v0.2.6
v0.2.7
v0.2.8
v0.2.9
v0.3.0
v0.3.1
v0.3.10
v0.3.11
v0.3.12
v0.3.13
v0.3.14
v0.3.2
v0.3.3
v0.3.4
v0.3.5
v0.3.6
v0.3.7
v0.3.8
v0.3.9
v0.4.0
v0.4.1
v0.4.10
v0.4.11
v0.4.12
v0.4.13
v0.4.14
v0.4.15
v0.4.16
v0.4.17
v0.4.18
v0.4.19
v0.4.2
v0.4.20
v0.4.21
v0.4.22
v0.4.23
v0.4.24
v0.4.25
v0.4.26
v0.4.27
v0.4.28
v0.4.29
v0.4.3
v0.4.30
v0.4.31
v0.4.32
v0.4.33
v0.4.34
v0.4.35
v0.4.36
v0.4.37
v0.4.38
v0.4.39
v0.4.4
v0.4.40
v0.4.41
v0.4.42
v0.4.43
v0.4.44
v0.4.5
v0.4.6
v0.4.7
v0.4.8
v0.4.9
v0.5.0
v0.5.0-alpha
v0.5.0-alpha.1
v0.5.0-alpha.10
v0.5.0-alpha.11
v0.5.0-alpha.12
v0.5.0-alpha.13
v0.5.0-alpha.14
v0.5.0-alpha.15
v0.5.0-alpha.2
v0.5.0-alpha.3
v0.5.0-alpha.4
v0.5.0-alpha.5
v0.5.0-alpha.6
v0.5.0-alpha.7
v0.5.0-alpha.8
v0.5.0-alpha.9
v0.5.1
v0.5.2
v0.5.3
v0.5.4
v0.5.5
v0.5.6
v0.5.7
v0.6.0
v0.6.1
v0.6.10
v0.6.11
v0.6.12
v0.6.13
v0.6.14
v0.6.15
v0.6.16
v0.6.17
v0.6.18
v0.6.19
v0.6.2
v0.6.20
v0.6.21
v0.6.22
v0.6.23
v0.6.24
v0.6.25
v0.6.26
v0.6.27
v0.6.28
v0.6.29
v0.6.3
v0.6.30
v0.6.4
v0.6.5
v0.6.6
v0.6.7
v0.6.8
v0.6.9
-
689b83bbe3
fix(loading): make sure not to load to cuda with kbit quantisation
aarnphm-ec2-dev
2023-08-10 19:39:01 +00:00 -
7c3646bb89
infra: bump to homebrew tap release to 0.2.20 [generated] [skip ci]
Aaron Pham
2023-08-10 03:26:20 +00:00 -
d99e342d88
infra: bump to dev version of 0.2.21.dev0 [generated] [skip ci]
Aaron Pham
2023-08-10 03:23:24 +00:00 -
78912a314c
infra: prepare for release 0.2.20 [generated] [skip ci]
v0.2.20
Aaron Pham
2023-08-10 03:04:19 +00:00 -
bc13b6f137
fix: update dependencies with brew tap
Aaron
2023-08-09 22:54:37 -04:00 -
e0daea6e78
fix(compile): absolute import for compiled wheels
Aaron
2023-08-09 22:46:17 -04:00 -
6fbacecaf6
infra: bump to dev version of 0.2.20.dev0 [generated] [skip ci]
Aaron Pham
2023-08-10 02:49:10 +00:00 -
99c8f299ce
infra: prepare for release 0.2.19 [generated] [skip ci]
v0.2.19
Aaron Pham
2023-08-10 02:26:15 +00:00 -
6143521547
fix: release compiled wheels and 0.2.18 tap (#193)
Aaron Pham
2023-08-09 21:14:34 -04:00 -
f0783420a2
infra: bump to dev version of 0.2.19.dev0 [generated] [skip ci]
Aaron Pham
2023-08-10 00:10:35 +00:00 -
221d959a46
infra: prepare for release 0.2.18 [generated] [skip ci]
v0.2.18
Aaron Pham
2023-08-09 23:50:37 +00:00 -
a44a317825
fix(ci): running test tap [skip ci]
Aaron
2023-08-09 19:48:29 -04:00 -
0d55d74868
fix: remove invalid token on dispatch [skip ci]
Aaron
2023-08-09 19:44:42 -04:00 -
dfc4b489c5
feat(build): notes on compiled wheels for Bento
aarnphm-ec2-dev
2023-08-09 21:52:34 +00:00 -
0640af026c
chore(docs): add instruction for compiled module development [skip ci]
aarnphm-ec2-dev
2023-08-09 21:30:43 +00:00 -
b1445c6516
refactor(cli): compiled wheels and extension modules (#191)
Aaron Pham
2023-08-09 17:10:15 -04:00 -
ae11e487d9
fix(brew): specific installation from gzip [skip ci]
Aaron
2023-08-08 22:32:11 -04:00 -
aaa8ec433c
chore(ci): running pyright last
Aaron
2023-08-08 22:19:08 -04:00 -
21143fdfab
fix(brew): set correct url for release
Aaron
2023-08-08 22:15:23 -04:00 -
b9dd54f634
feat: homebrew tap (#190)
Aaron Pham
2023-08-08 22:11:48 -04:00 -
deaee67b47
fix(loading): make sure to cast the model to cuda if PyTorch
aarnphm-ec2-dev
2023-08-09 01:42:11 +00:00 -
ae35ee8115
fix(build): set legacy serialisation for vllm on Bento
aarnphm-ec2-dev
2023-08-08 10:17:48 +00:00 -
2d47a54efd
feat(strategy): spawn one runner instance (#189)
Aaron Pham
2023-08-08 05:47:11 -04:00 -
9c3019d236
infra: bump to dev version of 0.2.18.dev0 [generated] [skip ci]
Aaron Pham
2023-08-08 05:44:51 +00:00 -
126491f272
infra: prepare for release 0.2.17 [generated] [skip ci]
v0.2.17
Aaron Pham
2023-08-08 05:34:43 +00:00 -
cb6f3aa48e
feat: --force-push to allow force push to bentocloud (#188)
Aaron Pham
2023-08-08 01:06:59 -04:00 -
371a7c896c
fix: loading models within k8s API server
Aaron
2023-08-08 00:22:48 -04:00 -
0139613f3c
ci: pre-commit autoupdate [pre-commit.ci] [skip ci] (#187)
pre-commit-ci[bot]
2023-08-07 18:02:26 -04:00 -
21ea7e493f
feat(generation): initial work for generating tokens (#186)
Aaron Pham
2023-08-06 20:04:40 -04:00 -
2d5be909cd
fix(models): setup xformers and loading PyTorch meta weights (#185)
Aaron Pham
2023-08-06 03:25:02 -04:00 -
96b25842d1
chore(docs): update security notes obsidian style [skip ci]
Aaron
2023-08-06 02:00:02 -04:00 -
74a928f6f3
chore: CODE_OF_CONDUCT.md [skip ci]
Aaron Pham
2023-08-06 01:56:08 -04:00 -
752de09626
fix(ci): update version correctly [skip ci] (#184)
Aaron Pham
2023-08-06 01:18:33 -04:00 -
4875c3a109
feat: optimize model saving and loading on single GPU (#183)
Aaron Pham
2023-08-06 01:00:49 -04:00 -
8bba90f611
fix: add release for correct CI version [skip ci]
aarnphm-ec2-dev
2023-08-05 07:41:50 +00:00 -
82d7ab67f3
infra: bump to dev version of ..1.dev0 [generated] [skip ci]
Aaron Pham
2023-08-04 16:56:48 +00:00 -
f68beb5ccb
infra: prepare for release 0.2.16 [generated] [skip ci]
v0.2.16
Aaron Pham
2023-08-04 16:43:29 +00:00 -
90072ec5ee
fix(regression): setting quantize only if it is not None
Aaron
2023-08-04 12:40:55 -04:00 -
ba07205156
fix: disable building xformers from source
Aaron
2023-08-04 12:14:04 -04:00 -
794719670e
chore: update README [skip ci]
Aaron
2023-08-04 12:10:21 -04:00 -
cdc6bae0e9
infra: bump to dev version of ..1.dev0 [generated] [skip ci]
Aaron Pham
2023-08-04 15:47:20 +00:00 -
9d1476e360
infra: prepare for release 0.2.15 [generated] [skip ci]
v0.2.15
Aaron Pham
2023-08-04 15:32:47 +00:00 -
287b7f9ab2
fix: releases issue when building new container [skip ci]
Aaron
2023-08-04 11:31:02 -04:00 -
20deb3354d
infra: bump to dev version of 0.2.15.dev0 [generated] [skip ci]
Aaron
2023-08-04 11:11:14 -04:00 -
cb05446760
infra: prepare for release 0.2.14 [generated] [skip ci]
v0.2.14
Aaron Pham
2023-08-04 14:50:59 +00:00 -
975a1d0349
fix: remove tokens for release [skip ci]
Aaron
2023-08-04 10:49:06 -04:00 -
1e74e967d1
fix(container): correct cache directory
Aaron
2023-08-04 10:31:06 -04:00 -
2541a0f8dc
infra: initial work on compiling mypyc wheels (#182)
Aaron Pham
2023-08-04 10:20:03 -04:00 -
2cc264aa72
fix(vllm): correctly load given model id from envvar (#181)
Aaron Pham
2023-08-03 16:34:35 -04:00 -
db8e47bc5b
fix(build): correct module type for stubs and strip assert [skip ci]
Aaron
2023-08-03 04:15:55 -04:00 -
8f74e24c2f
fix: clone all for nightly strategy
Aaron
2023-08-03 03:17:18 -04:00 -
b949106daf
fix(ci): rename runner name [skip ci]
Aaron
2023-08-03 02:24:45 -04:00 -
e9eff70978
infra: bump to dev version of 0.2.14.dev0 [generated] [skip ci]
Aaron Pham
2023-08-03 06:18:57 +00:00 -
8428692d45
infra: prepare for release 0.2.13 [generated] [skip ci]
v0.2.13
Aaron Pham
2023-08-03 06:06:09 +00:00 -
cac7a19be9
fix(build): to run on tags [skip ci]
Aaron
2023-08-03 01:59:18 -04:00 -
29ca9f398f
fix: add arch_list for cross compiling
aarnphm-ec2-dev
2023-08-03 04:33:48 +00:00 -
f5eb21ede0
revert: "chore(aws): use g4dn for more availability"
Aaron
2023-08-02 23:55:29 -04:00 -
a01d867bc7
chore(base): add auto-gptq CUDA kernel
aarnphm-ec2-dev
2023-08-03 02:40:06 +00:00 -
820b4991fa
chore(stubs): add generated for auto-gptq and vllm [skip ci]
aarnphm-ec2-dev
2023-08-03 02:28:24 +00:00 -
a06464bdc7
chore(aws): use g4dn for more availability
aarnphm-ec2-dev
2023-08-03 02:17:37 +00:00 -
af64a6dfd5
chore(docs): update to obsidian README format
Aaron
2023-08-02 21:49:33 -04:00 -
b349820429
fix(build): add `--device` into envvar
aarnphm-ec2-dev
2023-08-03 00:44:40 +00:00 -
cfc7f3888d
chore(vllm): add all supported models (#179)
Aaron Pham
2023-08-02 17:42:02 -04:00 -
72337410cf
fix: nightly resolver for correct tag (#177)
Aaron Pham
2023-08-02 13:10:50 -04:00 -
d4fbfa5e5c
fix: custom release strategy for correct naming
Aaron
2023-08-02 03:03:21 -04:00 -
acb81a6e1a
fix(build): dispatch container via workflow calls (#174)
Aaron Pham
2023-08-02 01:54:10 -04:00 -
f989ebd4b9
infra: bump to dev version of 0.2.13.dev0 [generated] [skip ci]
Aaron
2023-08-01 19:52:56 -04:00 -
57fdbda192
infra: prepare for release 0.2.12 [generated] [skip ci]
v0.2.12
Aaron Pham
2023-08-01 23:27:01 +00:00 -
af54ff299f
fix(ec2): increase subnet availability to all available zone with g5 instances
Aaron
2023-08-01 16:07:41 -04:00 -
c2ed1d56da
chore(release): update base container restriction (#173)
pre-commit-ci[bot]
2023-08-01 15:25:17 -04:00 -
6ba8899743
fix: remove invalid OPENLLMDEVDEBUG envvar
Aaron
2023-08-01 01:52:08 -04:00 -
961455c762
fix(cli): always --force on --push
Aaron
2023-07-31 23:39:56 -04:00 -
ca5e3c7ae5
fix: correct setup property for envvar instance
Aaron
2023-07-31 23:34:42 -04:00 -
16f032417e
revert: "infra: reduce instance type for more lenient"
Aaron
2023-07-31 21:34:56 -04:00 -
4a1d849203
infra: reduce instance type for more lenient
Aaron
2023-07-31 21:25:59 -04:00 -
23c5aa5958
revert: remove unreleased changelog
Aaron
2023-07-31 21:07:00 -04:00 -
fa0e947dd0
chore: add editorconfig [skip ci]
Aaron
2023-07-31 20:21:22 -04:00 -
729e423b17
chore(bnb): filter warnings message on CPU (#170)
Aaron Pham
2023-07-31 15:48:59 -04:00 -
19d88d4cb8
infra: ignore rev that update styling [skip ci]
Aaron
2023-07-31 09:07:58 -04:00 -
e01853a81c
chore(infra): disable update-changelog for now [skip ci]
Aaron
2023-07-31 09:05:50 -04:00 -
ec3c381e8c
infra: add instruction for using docker images from release notes (#169)
Aaron Pham
2023-07-31 08:39:10 -04:00 -
8c2867d26d
style: define experimental guidelines (#168)
Aaron Pham
2023-07-31 07:54:26 -04:00 -
2c2070f69f
chore(deps): bump docker/setup-qemu-action from 2.1.0 to 2.2.0 [skip ci] (#165)
dependabot[bot]
2023-07-31 07:52:16 -04:00 -
94c949c22c
chore(deps): bump aws-actions/configure-aws-credentials from 1 to 2 [skip ci] (#167)
dependabot[bot]
2023-07-31 07:45:50 -04:00 -
9592ca02fb
chore(deps): bump docker/setup-buildx-action from 2.5.0 to 2.9.1 [skip ci] (#164)
dependabot[bot]
2023-07-31 07:45:26 -04:00 -
4d566fee09
chore(deps): bump peter-evans/create-pull-request from 4 to 5 [skip ci] (#166)
dependabot[bot]
2023-07-31 07:45:05 -04:00 -
b5652e7d66
fix(ci): agree with signing
Aaron
2023-07-31 06:40:14 -04:00 -
431b326dd3
chore(deps): bump docker/login-action from 2.1.0 to 2.2.0 (#163)
dependabot[bot]
2023-07-31 09:26:06 +00:00 -
ae17322b73
fix(ci): correct set digest for signing images
Aaron
2023-07-31 04:27:15 -04:00 -
4fbfb363bf
infra: update changelog and added readme badges [generated] (#162)
Aaron Pham
2023-07-31 04:02:02 -04:00 -
fec68d732b
fix(ci): Correctly set signing for pushing container images (#161)
Aaron Pham
2023-07-31 03:43:07 -04:00 -
ef94c6b98a
feat(container): vLLM build and base image strategies (#142)
Aaron Pham
2023-07-31 02:44:52 -04:00 -
001ff6b5ac
docs: update README.md typos (#155)
RichardScottOZ
2023-07-29 19:10:40 +09:30 -
0c79fabd1a
chore(release): add darwin binary to release notes (#154)
Aaron Pham
2023-07-28 15:00:42 -04:00 -
4de0ca8a13
infra: bump to dev version of 0.2.12.dev0 [generated] [skip ci]
Aaron Pham
2023-07-28 00:14:52 +00:00 -
7d9dcb5d40
infra: prepare for release 0.2.11 [generated] [skip ci]
v0.2.11
Aaron Pham
2023-07-28 00:04:32 +00:00 -
fc66ff275b
fix: make sure to add torch to dependencies
aarnphm-ec2-dev
2023-07-28 00:01:52 +00:00 -
15640a85cd
feat: supports embeddings for T5 and ChatGLM family generation (#153)
Aaron Pham
2023-07-27 16:43:43 -04:00 -
e075bd25ea
chore: add NousResearch's as non-gated Llama (#152)
Aaron Pham
2023-07-27 15:30:56 -04:00 -
eacd8d9f46
fix(pre-commit): disable auto fixes (#151)
Aaron Pham
2023-07-27 13:37:09 -04:00