Spaces:
Running
Running
Commit
·
86fe272
1
Parent(s):
02f502d
Push to HF space
Browse files- Dockerfile +6 -2
- data/lilac.yml +448 -56
- docker_start.sh +1 -1
Dockerfile
CHANGED
@@ -1,9 +1,12 @@
|
|
1 |
-
|
2 |
-
FROM python:3.9-bullseye
|
3 |
|
4 |
# Allow statements and log messages to immediately appear in the Knative logs
|
5 |
ENV PYTHONUNBUFFERED True
|
6 |
|
|
|
|
|
|
|
|
|
7 |
# See: https://huggingface.co/docs/hub/spaces-sdks-docker#permissions
|
8 |
RUN useradd -m -u 1000 user
|
9 |
USER user
|
@@ -39,4 +42,5 @@ COPY --chown=user docker_start.sh ./
|
|
39 |
RUN mkdir -p ./data
|
40 |
RUN chown -R user ./data
|
41 |
|
|
|
42 |
CMD ["bash", "docker_start.sh"]
|
|
|
1 |
+
FROM python:3.11-slim-bullseye
|
|
|
2 |
|
3 |
# Allow statements and log messages to immediately appear in the Knative logs
|
4 |
ENV PYTHONUNBUFFERED True
|
5 |
|
6 |
+
# Adds GCC and other build tools so we can compile hnswlib and other native/C++ deps.
|
7 |
+
RUN apt-get update --fix-missing && apt-get install -y --fix-missing build-essential && \
|
8 |
+
rm -rf /var/lib/apt/lists/*
|
9 |
+
|
10 |
# See: https://huggingface.co/docs/hub/spaces-sdks-docker#permissions
|
11 |
RUN useradd -m -u 1000 user
|
12 |
USER user
|
|
|
42 |
RUN mkdir -p ./data
|
43 |
RUN chown -R user ./data
|
44 |
|
45 |
+
EXPOSE 8000
|
46 |
CMD ["bash", "docker_start.sh"]
|
data/lilac.yml
CHANGED
@@ -230,10 +230,13 @@ datasets:
|
|
230 |
signal_name: concept_score
|
231 |
- path: text
|
232 |
signal:
|
233 |
-
embedding: gte-small
|
234 |
-
eps: 0.05
|
235 |
-
min_samples: 5
|
236 |
signal_name: cluster_dbscan
|
|
|
|
|
|
|
|
|
|
|
|
|
237 |
settings:
|
238 |
ui:
|
239 |
media_paths:
|
@@ -407,10 +410,13 @@ datasets:
|
|
407 |
signal_name: concept_score
|
408 |
- path: text
|
409 |
signal:
|
410 |
-
embedding: gte-small
|
411 |
-
eps: 0.05
|
412 |
-
min_samples: 5
|
413 |
signal_name: cluster_dbscan
|
|
|
|
|
|
|
|
|
|
|
|
|
414 |
settings:
|
415 |
ui:
|
416 |
media_paths:
|
@@ -576,10 +582,13 @@ datasets:
|
|
576 |
signal_name: concept_score
|
577 |
- path: text
|
578 |
signal:
|
579 |
-
embedding: gte-small
|
580 |
-
eps: 0.05
|
581 |
-
min_samples: 5
|
582 |
signal_name: cluster_dbscan
|
|
|
|
|
|
|
|
|
|
|
|
|
583 |
settings:
|
584 |
ui:
|
585 |
media_paths:
|
@@ -605,6 +614,20 @@ datasets:
|
|
605 |
- value
|
606 |
- '*'
|
607 |
embedding: gte-small
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
608 |
signals:
|
609 |
- path: original-instruction
|
610 |
signal:
|
@@ -2856,9 +2879,6 @@ datasets:
|
|
2856 |
signal_name: concept_score
|
2857 |
- path: original-instruction
|
2858 |
signal:
|
2859 |
-
embedding: gte-small
|
2860 |
-
eps: 0.05
|
2861 |
-
min_samples: 5
|
2862 |
signal_name: cluster_dbscan
|
2863 |
- path: original-instruction
|
2864 |
signal:
|
@@ -2926,15 +2946,9 @@ datasets:
|
|
2926 |
signal_name: concept_score
|
2927 |
- path: original-context
|
2928 |
signal:
|
2929 |
-
embedding: gte-small
|
2930 |
-
eps: 0.05
|
2931 |
-
min_samples: 5
|
2932 |
signal_name: cluster_dbscan
|
2933 |
- path: original-response
|
2934 |
signal:
|
2935 |
-
embedding: gte-small
|
2936 |
-
eps: 0.05
|
2937 |
-
min_samples: 5
|
2938 |
signal_name: cluster_dbscan
|
2939 |
- path: original-response
|
2940 |
signal:
|
@@ -3000,15 +3014,355 @@ datasets:
|
|
3000 |
version: null
|
3001 |
draft: main
|
3002 |
signal_name: concept_score
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
3003 |
- path:
|
3004 |
- new-instruction
|
3005 |
- value
|
3006 |
- '*'
|
3007 |
signal:
|
3008 |
embedding: gte-small
|
3009 |
-
|
3010 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
3011 |
signal_name: cluster_dbscan
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
3012 |
- path:
|
3013 |
- new-instruction
|
3014 |
- value
|
@@ -3103,18 +3457,18 @@ datasets:
|
|
3103 |
- '*'
|
3104 |
signal:
|
3105 |
embedding: gte-small
|
3106 |
-
|
3107 |
-
|
3108 |
-
signal_name:
|
3109 |
- path:
|
3110 |
- new-response
|
3111 |
- value
|
3112 |
- '*'
|
3113 |
signal:
|
3114 |
embedding: gte-small
|
3115 |
-
|
3116 |
-
|
3117 |
-
signal_name:
|
3118 |
- path:
|
3119 |
- new-response
|
3120 |
- value
|
@@ -3784,16 +4138,22 @@ datasets:
|
|
3784 |
signal_name: concept_score
|
3785 |
- path: question
|
3786 |
signal:
|
3787 |
-
embedding: gte-small
|
3788 |
-
eps: 0.05
|
3789 |
-
min_samples: 5
|
3790 |
signal_name: cluster_dbscan
|
3791 |
- path: response
|
3792 |
signal:
|
3793 |
-
embedding: gte-small
|
3794 |
-
eps: 0.05
|
3795 |
-
min_samples: 5
|
3796 |
signal_name: cluster_dbscan
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
3797 |
settings:
|
3798 |
ui:
|
3799 |
media_paths:
|
@@ -4190,18 +4550,28 @@ datasets:
|
|
4190 |
- translation
|
4191 |
- es
|
4192 |
signal:
|
4193 |
-
embedding: gte-small
|
4194 |
-
eps: 0.05
|
4195 |
-
min_samples: 5
|
4196 |
signal_name: cluster_dbscan
|
4197 |
- path:
|
4198 |
- translation
|
4199 |
- en
|
4200 |
signal:
|
4201 |
-
embedding: gte-small
|
4202 |
-
eps: 0.05
|
4203 |
-
min_samples: 5
|
4204 |
signal_name: cluster_dbscan
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
4205 |
settings:
|
4206 |
ui:
|
4207 |
media_paths:
|
@@ -4370,10 +4740,13 @@ datasets:
|
|
4370 |
signal_name: concept_score
|
4371 |
- path: lecture
|
4372 |
signal:
|
4373 |
-
embedding: gte-small
|
4374 |
-
eps: 0.05
|
4375 |
-
min_samples: 5
|
4376 |
signal_name: cluster_dbscan
|
|
|
|
|
|
|
|
|
|
|
|
|
4377 |
settings:
|
4378 |
ui:
|
4379 |
media_paths:
|
@@ -4539,10 +4912,13 @@ datasets:
|
|
4539 |
signal_name: concept_score
|
4540 |
- path: text
|
4541 |
signal:
|
4542 |
-
embedding: gte-small
|
4543 |
-
eps: 0.05
|
4544 |
-
min_samples: 5
|
4545 |
signal_name: cluster_dbscan
|
|
|
|
|
|
|
|
|
|
|
|
|
4546 |
settings:
|
4547 |
ui:
|
4548 |
media_paths:
|
@@ -4707,10 +5083,13 @@ datasets:
|
|
4707 |
signal_name: concept_score
|
4708 |
- path: overview
|
4709 |
signal:
|
4710 |
-
embedding: gte-small
|
4711 |
-
eps: 0.05
|
4712 |
-
min_samples: 5
|
4713 |
signal_name: cluster_dbscan
|
|
|
|
|
|
|
|
|
|
|
|
|
4714 |
settings:
|
4715 |
ui:
|
4716 |
media_paths:
|
@@ -5026,24 +5405,37 @@ datasets:
|
|
5026 |
- outline
|
5027 |
- '*'
|
5028 |
signal:
|
5029 |
-
embedding: gte-small
|
5030 |
-
eps: 0.05
|
5031 |
-
min_samples: 5
|
5032 |
signal_name: cluster_dbscan
|
5033 |
- path:
|
5034 |
- concepts
|
5035 |
- '*'
|
5036 |
signal:
|
5037 |
-
embedding: gte-small
|
5038 |
-
eps: 0.05
|
5039 |
-
min_samples: 5
|
5040 |
signal_name: cluster_dbscan
|
5041 |
- path: markdown
|
5042 |
signal:
|
5043 |
-
embedding: gte-small
|
5044 |
-
eps: 0.05
|
5045 |
-
min_samples: 5
|
5046 |
signal_name: cluster_dbscan
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
5047 |
settings:
|
5048 |
ui:
|
5049 |
media_paths:
|
|
|
230 |
signal_name: concept_score
|
231 |
- path: text
|
232 |
signal:
|
|
|
|
|
|
|
233 |
signal_name: cluster_dbscan
|
234 |
+
- path: text
|
235 |
+
signal:
|
236 |
+
embedding: gte-small
|
237 |
+
min_cluster_size: 5
|
238 |
+
umap_n_components: 10
|
239 |
+
signal_name: cluster_hdbscan
|
240 |
settings:
|
241 |
ui:
|
242 |
media_paths:
|
|
|
410 |
signal_name: concept_score
|
411 |
- path: text
|
412 |
signal:
|
|
|
|
|
|
|
413 |
signal_name: cluster_dbscan
|
414 |
+
- path: text
|
415 |
+
signal:
|
416 |
+
embedding: gte-small
|
417 |
+
min_cluster_size: 5
|
418 |
+
umap_n_components: 10
|
419 |
+
signal_name: cluster_hdbscan
|
420 |
settings:
|
421 |
ui:
|
422 |
media_paths:
|
|
|
582 |
signal_name: concept_score
|
583 |
- path: text
|
584 |
signal:
|
|
|
|
|
|
|
585 |
signal_name: cluster_dbscan
|
586 |
+
- path: text
|
587 |
+
signal:
|
588 |
+
embedding: gte-small
|
589 |
+
min_cluster_size: 5
|
590 |
+
umap_n_components: 10
|
591 |
+
signal_name: cluster_hdbscan
|
592 |
settings:
|
593 |
ui:
|
594 |
media_paths:
|
|
|
614 |
- value
|
615 |
- '*'
|
616 |
embedding: gte-small
|
617 |
+
- path: original-instruction
|
618 |
+
embedding: gte-small
|
619 |
+
- path: original-response
|
620 |
+
embedding: gte-small
|
621 |
+
- path:
|
622 |
+
- new-instruction
|
623 |
+
- value
|
624 |
+
- '*'
|
625 |
+
embedding: gte-small
|
626 |
+
- path:
|
627 |
+
- new-response
|
628 |
+
- value
|
629 |
+
- '*'
|
630 |
+
embedding: gte-small
|
631 |
signals:
|
632 |
- path: original-instruction
|
633 |
signal:
|
|
|
2879 |
signal_name: concept_score
|
2880 |
- path: original-instruction
|
2881 |
signal:
|
|
|
|
|
|
|
2882 |
signal_name: cluster_dbscan
|
2883 |
- path: original-instruction
|
2884 |
signal:
|
|
|
2946 |
signal_name: concept_score
|
2947 |
- path: original-context
|
2948 |
signal:
|
|
|
|
|
|
|
2949 |
signal_name: cluster_dbscan
|
2950 |
- path: original-response
|
2951 |
signal:
|
|
|
|
|
|
|
2952 |
signal_name: cluster_dbscan
|
2953 |
- path: original-response
|
2954 |
signal:
|
|
|
3014 |
version: null
|
3015 |
draft: main
|
3016 |
signal_name: concept_score
|
3017 |
+
- path:
|
3018 |
+
- new-instruction
|
3019 |
+
- value
|
3020 |
+
- '*'
|
3021 |
+
signal:
|
3022 |
+
signal_name: cluster_dbscan
|
3023 |
+
- path:
|
3024 |
+
- new-instruction
|
3025 |
+
- value
|
3026 |
+
- '*'
|
3027 |
+
signal:
|
3028 |
+
embedding: gte-small
|
3029 |
+
namespace: lilac
|
3030 |
+
concept_name: legal-termination
|
3031 |
+
version: null
|
3032 |
+
draft: main
|
3033 |
+
signal_name: concept_score
|
3034 |
- path:
|
3035 |
- new-instruction
|
3036 |
- value
|
3037 |
- '*'
|
3038 |
signal:
|
3039 |
embedding: gte-small
|
3040 |
+
namespace: lilac
|
3041 |
+
concept_name: negative-sentiment
|
3042 |
+
version: null
|
3043 |
+
draft: main
|
3044 |
+
signal_name: concept_score
|
3045 |
+
- path:
|
3046 |
+
- new-instruction
|
3047 |
+
- value
|
3048 |
+
- '*'
|
3049 |
+
signal:
|
3050 |
+
embedding: gte-small
|
3051 |
+
namespace: lilac
|
3052 |
+
concept_name: non-english
|
3053 |
+
version: null
|
3054 |
+
draft: main
|
3055 |
+
signal_name: concept_score
|
3056 |
+
- path:
|
3057 |
+
- new-instruction
|
3058 |
+
- value
|
3059 |
+
- '*'
|
3060 |
+
signal:
|
3061 |
+
embedding: gte-small
|
3062 |
+
namespace: lilac
|
3063 |
+
concept_name: positive-sentiment
|
3064 |
+
version: null
|
3065 |
+
draft: main
|
3066 |
+
signal_name: concept_score
|
3067 |
+
- path:
|
3068 |
+
- new-instruction
|
3069 |
+
- value
|
3070 |
+
- '*'
|
3071 |
+
signal:
|
3072 |
+
embedding: gte-small
|
3073 |
+
namespace: lilac
|
3074 |
+
concept_name: profanity
|
3075 |
+
version: null
|
3076 |
+
draft: main
|
3077 |
+
signal_name: concept_score
|
3078 |
+
- path:
|
3079 |
+
- new-instruction
|
3080 |
+
- value
|
3081 |
+
- '*'
|
3082 |
+
signal:
|
3083 |
+
embedding: gte-small
|
3084 |
+
namespace: lilac
|
3085 |
+
concept_name: question
|
3086 |
+
version: null
|
3087 |
+
draft: main
|
3088 |
+
signal_name: concept_score
|
3089 |
+
- path:
|
3090 |
+
- new-instruction
|
3091 |
+
- value
|
3092 |
+
- '*'
|
3093 |
+
signal:
|
3094 |
+
embedding: gte-small
|
3095 |
+
namespace: lilac
|
3096 |
+
concept_name: source-code
|
3097 |
+
version: null
|
3098 |
+
draft: main
|
3099 |
+
signal_name: concept_score
|
3100 |
+
- path:
|
3101 |
+
- new-instruction
|
3102 |
+
- value
|
3103 |
+
- '*'
|
3104 |
+
signal:
|
3105 |
+
embedding: gte-small
|
3106 |
+
namespace: lilac
|
3107 |
+
concept_name: toxicity
|
3108 |
+
version: null
|
3109 |
+
draft: main
|
3110 |
+
signal_name: concept_score
|
3111 |
+
- path:
|
3112 |
+
- new-context
|
3113 |
+
- value
|
3114 |
+
- '*'
|
3115 |
+
signal:
|
3116 |
signal_name: cluster_dbscan
|
3117 |
+
- path:
|
3118 |
+
- new-response
|
3119 |
+
- value
|
3120 |
+
- '*'
|
3121 |
+
signal:
|
3122 |
+
signal_name: cluster_dbscan
|
3123 |
+
- path:
|
3124 |
+
- new-response
|
3125 |
+
- value
|
3126 |
+
- '*'
|
3127 |
+
signal:
|
3128 |
+
embedding: gte-small
|
3129 |
+
namespace: lilac
|
3130 |
+
concept_name: legal-termination
|
3131 |
+
version: null
|
3132 |
+
draft: main
|
3133 |
+
signal_name: concept_score
|
3134 |
+
- path:
|
3135 |
+
- new-response
|
3136 |
+
- value
|
3137 |
+
- '*'
|
3138 |
+
signal:
|
3139 |
+
embedding: gte-small
|
3140 |
+
namespace: lilac
|
3141 |
+
concept_name: negative-sentiment
|
3142 |
+
version: null
|
3143 |
+
draft: main
|
3144 |
+
signal_name: concept_score
|
3145 |
+
- path:
|
3146 |
+
- new-response
|
3147 |
+
- value
|
3148 |
+
- '*'
|
3149 |
+
signal:
|
3150 |
+
embedding: gte-small
|
3151 |
+
namespace: lilac
|
3152 |
+
concept_name: non-english
|
3153 |
+
version: null
|
3154 |
+
draft: main
|
3155 |
+
signal_name: concept_score
|
3156 |
+
- path:
|
3157 |
+
- new-response
|
3158 |
+
- value
|
3159 |
+
- '*'
|
3160 |
+
signal:
|
3161 |
+
embedding: gte-small
|
3162 |
+
namespace: lilac
|
3163 |
+
concept_name: positive-sentiment
|
3164 |
+
version: null
|
3165 |
+
draft: main
|
3166 |
+
signal_name: concept_score
|
3167 |
+
- path:
|
3168 |
+
- new-response
|
3169 |
+
- value
|
3170 |
+
- '*'
|
3171 |
+
signal:
|
3172 |
+
embedding: gte-small
|
3173 |
+
namespace: lilac
|
3174 |
+
concept_name: profanity
|
3175 |
+
version: null
|
3176 |
+
draft: main
|
3177 |
+
signal_name: concept_score
|
3178 |
+
- path:
|
3179 |
+
- new-response
|
3180 |
+
- value
|
3181 |
+
- '*'
|
3182 |
+
signal:
|
3183 |
+
embedding: gte-small
|
3184 |
+
namespace: lilac
|
3185 |
+
concept_name: question
|
3186 |
+
version: null
|
3187 |
+
draft: main
|
3188 |
+
signal_name: concept_score
|
3189 |
+
- path:
|
3190 |
+
- new-response
|
3191 |
+
- value
|
3192 |
+
- '*'
|
3193 |
+
signal:
|
3194 |
+
embedding: gte-small
|
3195 |
+
namespace: lilac
|
3196 |
+
concept_name: source-code
|
3197 |
+
version: null
|
3198 |
+
draft: main
|
3199 |
+
signal_name: concept_score
|
3200 |
+
- path:
|
3201 |
+
- new-response
|
3202 |
+
- value
|
3203 |
+
- '*'
|
3204 |
+
signal:
|
3205 |
+
embedding: gte-small
|
3206 |
+
namespace: lilac
|
3207 |
+
concept_name: toxicity
|
3208 |
+
version: null
|
3209 |
+
draft: main
|
3210 |
+
signal_name: concept_score
|
3211 |
+
- path: original-instruction
|
3212 |
+
signal:
|
3213 |
+
embedding: gte-small
|
3214 |
+
min_cluster_size: 5
|
3215 |
+
umap_n_components: 10
|
3216 |
+
signal_name: cluster_hdbscan
|
3217 |
+
- path: original-instruction
|
3218 |
+
signal:
|
3219 |
+
embedding: gte-small
|
3220 |
+
namespace: lilac
|
3221 |
+
concept_name: legal-termination
|
3222 |
+
version: null
|
3223 |
+
draft: main
|
3224 |
+
signal_name: concept_score
|
3225 |
+
- path: original-instruction
|
3226 |
+
signal:
|
3227 |
+
embedding: gte-small
|
3228 |
+
namespace: lilac
|
3229 |
+
concept_name: negative-sentiment
|
3230 |
+
version: null
|
3231 |
+
draft: main
|
3232 |
+
signal_name: concept_score
|
3233 |
+
- path: original-instruction
|
3234 |
+
signal:
|
3235 |
+
embedding: gte-small
|
3236 |
+
namespace: lilac
|
3237 |
+
concept_name: non-english
|
3238 |
+
version: null
|
3239 |
+
draft: main
|
3240 |
+
signal_name: concept_score
|
3241 |
+
- path: original-instruction
|
3242 |
+
signal:
|
3243 |
+
embedding: gte-small
|
3244 |
+
namespace: lilac
|
3245 |
+
concept_name: positive-sentiment
|
3246 |
+
version: null
|
3247 |
+
draft: main
|
3248 |
+
signal_name: concept_score
|
3249 |
+
- path: original-instruction
|
3250 |
+
signal:
|
3251 |
+
embedding: gte-small
|
3252 |
+
namespace: lilac
|
3253 |
+
concept_name: profanity
|
3254 |
+
version: null
|
3255 |
+
draft: main
|
3256 |
+
signal_name: concept_score
|
3257 |
+
- path: original-instruction
|
3258 |
+
signal:
|
3259 |
+
embedding: gte-small
|
3260 |
+
namespace: lilac
|
3261 |
+
concept_name: question
|
3262 |
+
version: null
|
3263 |
+
draft: main
|
3264 |
+
signal_name: concept_score
|
3265 |
+
- path: original-instruction
|
3266 |
+
signal:
|
3267 |
+
embedding: gte-small
|
3268 |
+
namespace: lilac
|
3269 |
+
concept_name: source-code
|
3270 |
+
version: null
|
3271 |
+
draft: main
|
3272 |
+
signal_name: concept_score
|
3273 |
+
- path: original-instruction
|
3274 |
+
signal:
|
3275 |
+
embedding: gte-small
|
3276 |
+
namespace: lilac
|
3277 |
+
concept_name: toxicity
|
3278 |
+
version: null
|
3279 |
+
draft: main
|
3280 |
+
signal_name: concept_score
|
3281 |
+
- path: original-context
|
3282 |
+
signal:
|
3283 |
+
embedding: gte-small
|
3284 |
+
min_cluster_size: 5
|
3285 |
+
umap_n_components: 10
|
3286 |
+
signal_name: cluster_hdbscan
|
3287 |
+
- path: original-response
|
3288 |
+
signal:
|
3289 |
+
embedding: gte-small
|
3290 |
+
min_cluster_size: 5
|
3291 |
+
umap_n_components: 10
|
3292 |
+
signal_name: cluster_hdbscan
|
3293 |
+
- path: original-response
|
3294 |
+
signal:
|
3295 |
+
embedding: gte-small
|
3296 |
+
namespace: lilac
|
3297 |
+
concept_name: legal-termination
|
3298 |
+
version: null
|
3299 |
+
draft: main
|
3300 |
+
signal_name: concept_score
|
3301 |
+
- path: original-response
|
3302 |
+
signal:
|
3303 |
+
embedding: gte-small
|
3304 |
+
namespace: lilac
|
3305 |
+
concept_name: negative-sentiment
|
3306 |
+
version: null
|
3307 |
+
draft: main
|
3308 |
+
signal_name: concept_score
|
3309 |
+
- path: original-response
|
3310 |
+
signal:
|
3311 |
+
embedding: gte-small
|
3312 |
+
namespace: lilac
|
3313 |
+
concept_name: non-english
|
3314 |
+
version: null
|
3315 |
+
draft: main
|
3316 |
+
signal_name: concept_score
|
3317 |
+
- path: original-response
|
3318 |
+
signal:
|
3319 |
+
embedding: gte-small
|
3320 |
+
namespace: lilac
|
3321 |
+
concept_name: positive-sentiment
|
3322 |
+
version: null
|
3323 |
+
draft: main
|
3324 |
+
signal_name: concept_score
|
3325 |
+
- path: original-response
|
3326 |
+
signal:
|
3327 |
+
embedding: gte-small
|
3328 |
+
namespace: lilac
|
3329 |
+
concept_name: profanity
|
3330 |
+
version: null
|
3331 |
+
draft: main
|
3332 |
+
signal_name: concept_score
|
3333 |
+
- path: original-response
|
3334 |
+
signal:
|
3335 |
+
embedding: gte-small
|
3336 |
+
namespace: lilac
|
3337 |
+
concept_name: question
|
3338 |
+
version: null
|
3339 |
+
draft: main
|
3340 |
+
signal_name: concept_score
|
3341 |
+
- path: original-response
|
3342 |
+
signal:
|
3343 |
+
embedding: gte-small
|
3344 |
+
namespace: lilac
|
3345 |
+
concept_name: source-code
|
3346 |
+
version: null
|
3347 |
+
draft: main
|
3348 |
+
signal_name: concept_score
|
3349 |
+
- path: original-response
|
3350 |
+
signal:
|
3351 |
+
embedding: gte-small
|
3352 |
+
namespace: lilac
|
3353 |
+
concept_name: toxicity
|
3354 |
+
version: null
|
3355 |
+
draft: main
|
3356 |
+
signal_name: concept_score
|
3357 |
+
- path:
|
3358 |
+
- new-instruction
|
3359 |
+
- value
|
3360 |
+
- '*'
|
3361 |
+
signal:
|
3362 |
+
embedding: gte-small
|
3363 |
+
min_cluster_size: 5
|
3364 |
+
umap_n_components: 10
|
3365 |
+
signal_name: cluster_hdbscan
|
3366 |
- path:
|
3367 |
- new-instruction
|
3368 |
- value
|
|
|
3457 |
- '*'
|
3458 |
signal:
|
3459 |
embedding: gte-small
|
3460 |
+
min_cluster_size: 5
|
3461 |
+
umap_n_components: 10
|
3462 |
+
signal_name: cluster_hdbscan
|
3463 |
- path:
|
3464 |
- new-response
|
3465 |
- value
|
3466 |
- '*'
|
3467 |
signal:
|
3468 |
embedding: gte-small
|
3469 |
+
min_cluster_size: 5
|
3470 |
+
umap_n_components: 10
|
3471 |
+
signal_name: cluster_hdbscan
|
3472 |
- path:
|
3473 |
- new-response
|
3474 |
- value
|
|
|
4138 |
signal_name: concept_score
|
4139 |
- path: question
|
4140 |
signal:
|
|
|
|
|
|
|
4141 |
signal_name: cluster_dbscan
|
4142 |
- path: response
|
4143 |
signal:
|
|
|
|
|
|
|
4144 |
signal_name: cluster_dbscan
|
4145 |
+
- path: question
|
4146 |
+
signal:
|
4147 |
+
embedding: gte-small
|
4148 |
+
min_cluster_size: 5
|
4149 |
+
umap_n_components: 10
|
4150 |
+
signal_name: cluster_hdbscan
|
4151 |
+
- path: response
|
4152 |
+
signal:
|
4153 |
+
embedding: gte-small
|
4154 |
+
min_cluster_size: 5
|
4155 |
+
umap_n_components: 10
|
4156 |
+
signal_name: cluster_hdbscan
|
4157 |
settings:
|
4158 |
ui:
|
4159 |
media_paths:
|
|
|
4550 |
- translation
|
4551 |
- es
|
4552 |
signal:
|
|
|
|
|
|
|
4553 |
signal_name: cluster_dbscan
|
4554 |
- path:
|
4555 |
- translation
|
4556 |
- en
|
4557 |
signal:
|
|
|
|
|
|
|
4558 |
signal_name: cluster_dbscan
|
4559 |
+
- path:
|
4560 |
+
- translation
|
4561 |
+
- es
|
4562 |
+
signal:
|
4563 |
+
embedding: gte-small
|
4564 |
+
min_cluster_size: 5
|
4565 |
+
umap_n_components: 10
|
4566 |
+
signal_name: cluster_hdbscan
|
4567 |
+
- path:
|
4568 |
+
- translation
|
4569 |
+
- en
|
4570 |
+
signal:
|
4571 |
+
embedding: gte-small
|
4572 |
+
min_cluster_size: 5
|
4573 |
+
umap_n_components: 10
|
4574 |
+
signal_name: cluster_hdbscan
|
4575 |
settings:
|
4576 |
ui:
|
4577 |
media_paths:
|
|
|
4740 |
signal_name: concept_score
|
4741 |
- path: lecture
|
4742 |
signal:
|
|
|
|
|
|
|
4743 |
signal_name: cluster_dbscan
|
4744 |
+
- path: lecture
|
4745 |
+
signal:
|
4746 |
+
embedding: gte-small
|
4747 |
+
min_cluster_size: 5
|
4748 |
+
umap_n_components: 10
|
4749 |
+
signal_name: cluster_hdbscan
|
4750 |
settings:
|
4751 |
ui:
|
4752 |
media_paths:
|
|
|
4912 |
signal_name: concept_score
|
4913 |
- path: text
|
4914 |
signal:
|
|
|
|
|
|
|
4915 |
signal_name: cluster_dbscan
|
4916 |
+
- path: text
|
4917 |
+
signal:
|
4918 |
+
embedding: gte-small
|
4919 |
+
min_cluster_size: 5
|
4920 |
+
umap_n_components: 10
|
4921 |
+
signal_name: cluster_hdbscan
|
4922 |
settings:
|
4923 |
ui:
|
4924 |
media_paths:
|
|
|
5083 |
signal_name: concept_score
|
5084 |
- path: overview
|
5085 |
signal:
|
|
|
|
|
|
|
5086 |
signal_name: cluster_dbscan
|
5087 |
+
- path: overview
|
5088 |
+
signal:
|
5089 |
+
embedding: gte-small
|
5090 |
+
min_cluster_size: 5
|
5091 |
+
umap_n_components: 10
|
5092 |
+
signal_name: cluster_hdbscan
|
5093 |
settings:
|
5094 |
ui:
|
5095 |
media_paths:
|
|
|
5405 |
- outline
|
5406 |
- '*'
|
5407 |
signal:
|
|
|
|
|
|
|
5408 |
signal_name: cluster_dbscan
|
5409 |
- path:
|
5410 |
- concepts
|
5411 |
- '*'
|
5412 |
signal:
|
|
|
|
|
|
|
5413 |
signal_name: cluster_dbscan
|
5414 |
- path: markdown
|
5415 |
signal:
|
|
|
|
|
|
|
5416 |
signal_name: cluster_dbscan
|
5417 |
+
- path:
|
5418 |
+
- outline
|
5419 |
+
- '*'
|
5420 |
+
signal:
|
5421 |
+
embedding: gte-small
|
5422 |
+
min_cluster_size: 5
|
5423 |
+
umap_n_components: 10
|
5424 |
+
signal_name: cluster_hdbscan
|
5425 |
+
- path:
|
5426 |
+
- concepts
|
5427 |
+
- '*'
|
5428 |
+
signal:
|
5429 |
+
embedding: gte-small
|
5430 |
+
min_cluster_size: 5
|
5431 |
+
umap_n_components: 10
|
5432 |
+
signal_name: cluster_hdbscan
|
5433 |
+
- path: markdown
|
5434 |
+
signal:
|
5435 |
+
embedding: gte-small
|
5436 |
+
min_cluster_size: 5
|
5437 |
+
umap_n_components: 10
|
5438 |
+
signal_name: cluster_hdbscan
|
5439 |
settings:
|
5440 |
ui:
|
5441 |
media_paths:
|
docker_start.sh
CHANGED
@@ -5,6 +5,6 @@ set -e
|
|
5 |
|
6 |
lilac hf-docker-start
|
7 |
gunicorn lilac.server:app \
|
8 |
-
--bind 0.0.0.0:
|
9 |
--preload -k uvicorn.workers.UvicornWorker \
|
10 |
--timeout 120
|
|
|
5 |
|
6 |
lilac hf-docker-start
|
7 |
gunicorn lilac.server:app \
|
8 |
+
--bind 0.0.0.0:8000 \
|
9 |
--preload -k uvicorn.workers.UvicornWorker \
|
10 |
--timeout 120
|