Upload conditioning_samples.json with huggingface_hub
Browse files- conditioning_samples.json +66 -66
conditioning_samples.json
CHANGED
|
@@ -1,140 +1,140 @@
|
|
| 1 |
{
|
| 2 |
-
"step":
|
| 3 |
"samples": [
|
| 4 |
{
|
| 5 |
-
"step":
|
| 6 |
"mode": "procedural_prefix",
|
| 7 |
-
"caption": "A medium-quality recording of a
|
| 8 |
-
"prefix": "[
|
| 9 |
-
"transcript": "
|
| 10 |
"adaln_summary": "(all zeros)",
|
| 11 |
"adaln_nonzero": 0
|
| 12 |
},
|
| 13 |
{
|
| 14 |
-
"step":
|
| 15 |
"mode": "procedural_prefix",
|
| 16 |
-
"caption": "A medium-quality recording of a male speaker
|
| 17 |
-
"prefix": "[
|
| 18 |
-
"transcript": "
|
| 19 |
"adaln_summary": "(all zeros)",
|
| 20 |
"adaln_nonzero": 0
|
| 21 |
},
|
| 22 |
{
|
| 23 |
-
"step":
|
| 24 |
"mode": "procedural_prefix",
|
| 25 |
-
"caption": "A medium-quality recording of a female speaker
|
| 26 |
-
"prefix": "[
|
| 27 |
-
"transcript": "
|
| 28 |
"adaln_summary": "(all zeros)",
|
| 29 |
"adaln_nonzero": 0
|
| 30 |
},
|
| 31 |
{
|
| 32 |
-
"step":
|
| 33 |
"mode": "static_caption",
|
| 34 |
-
"caption": "A
|
| 35 |
-
"prefix": "[The speaker sounds
|
| 36 |
-
"transcript": "
|
| 37 |
"adaln_summary": "(all zeros)",
|
| 38 |
"adaln_nonzero": 0
|
| 39 |
},
|
| 40 |
{
|
| 41 |
-
"step":
|
| 42 |
"mode": "static_caption",
|
| 43 |
-
"caption": "A
|
| 44 |
-
"prefix": "[
|
| 45 |
-
"transcript": "
|
| 46 |
"adaln_summary": "(all zeros)",
|
| 47 |
"adaln_nonzero": 0
|
| 48 |
},
|
| 49 |
{
|
| 50 |
-
"step":
|
| 51 |
"mode": "static_caption",
|
| 52 |
-
"caption": "A
|
| 53 |
-
"prefix": "[
|
| 54 |
-
"transcript": "
|
| 55 |
"adaln_summary": "(all zeros)",
|
| 56 |
"adaln_nonzero": 0
|
| 57 |
},
|
| 58 |
{
|
| 59 |
-
"step":
|
| 60 |
"mode": "adaln_only",
|
| 61 |
-
"caption": "A
|
| 62 |
"prefix": "",
|
| 63 |
-
"transcript": "
|
| 64 |
-
"adaln_summary": "Amusement=0.
|
| 65 |
-
"adaln_nonzero":
|
| 66 |
},
|
| 67 |
{
|
| 68 |
-
"step":
|
| 69 |
"mode": "adaln_only",
|
| 70 |
-
"caption": "A medium-quality recording of a male speaker
|
| 71 |
"prefix": "",
|
| 72 |
-
"transcript": "
|
| 73 |
-
"adaln_summary": "Elation=0.01, Thankfulness_Gratitude=0.
|
| 74 |
-
"adaln_nonzero":
|
| 75 |
},
|
| 76 |
{
|
| 77 |
-
"step":
|
| 78 |
"mode": "adaln_only",
|
| 79 |
-
"caption": "A
|
| 80 |
"prefix": "",
|
| 81 |
-
"transcript": "
|
| 82 |
-
"adaln_summary": "Amusement=
|
| 83 |
-
"adaln_nonzero":
|
| 84 |
},
|
| 85 |
{
|
| 86 |
-
"step":
|
| 87 |
"mode": "baseline",
|
| 88 |
-
"caption": "A
|
| 89 |
"prefix": "",
|
| 90 |
-
"transcript": "
|
| 91 |
"adaln_summary": "(all zeros)",
|
| 92 |
"adaln_nonzero": 0
|
| 93 |
},
|
| 94 |
{
|
| 95 |
-
"step":
|
| 96 |
"mode": "baseline",
|
| 97 |
-
"caption": "A medium-quality recording of a
|
| 98 |
"prefix": "",
|
| 99 |
-
"transcript": "
|
| 100 |
"adaln_summary": "(all zeros)",
|
| 101 |
"adaln_nonzero": 0
|
| 102 |
},
|
| 103 |
{
|
| 104 |
-
"step":
|
| 105 |
"mode": "baseline",
|
| 106 |
-
"caption": "A high-quality recording of a
|
| 107 |
"prefix": "",
|
| 108 |
-
"transcript": "
|
| 109 |
"adaln_summary": "(all zeros)",
|
| 110 |
"adaln_nonzero": 0
|
| 111 |
},
|
| 112 |
{
|
| 113 |
-
"step":
|
| 114 |
"mode": "dual",
|
| 115 |
-
"caption": "A
|
| 116 |
-
"prefix": "[
|
| 117 |
-
"transcript": "
|
| 118 |
-
"adaln_summary": "Elation=0.
|
| 119 |
-
"adaln_nonzero":
|
| 120 |
},
|
| 121 |
{
|
| 122 |
-
"step":
|
| 123 |
"mode": "dual",
|
| 124 |
-
"caption": "A medium-quality recording of a male speaker discussing
|
| 125 |
-
"prefix": "[
|
| 126 |
-
"transcript": "
|
| 127 |
-
"adaln_summary": "Elation=0.
|
| 128 |
"adaln_nonzero": 38
|
| 129 |
},
|
| 130 |
{
|
| 131 |
-
"step":
|
| 132 |
"mode": "dual",
|
| 133 |
-
"caption": "A medium-quality recording of a
|
| 134 |
-
"prefix": "[
|
| 135 |
-
"transcript": "
|
| 136 |
-
"adaln_summary": "Amusement=0.
|
| 137 |
-
"adaln_nonzero":
|
| 138 |
}
|
| 139 |
]
|
| 140 |
}
|
|
|
|
| 1 |
{
|
| 2 |
+
"step": 10000,
|
| 3 |
"samples": [
|
| 4 |
{
|
| 5 |
+
"step": 10000,
|
| 6 |
"mode": "procedural_prefix",
|
| 7 |
+
"caption": "A medium-quality recording of a man telling a story with a slightly humorous tone. He sounds a bit surprised and amused by the events he's describing. There are no sound effects or music.",
|
| 8 |
+
"prefix": "[present ecstatic, good overall quality, assertive absorbed, low-pitched, hesitant, fast speech, humorous, evident startled, considerable laughing, palpable hopeful]",
|
| 9 |
+
"transcript": "So he comes out to the window and he looks down and he sees a stormtrooper walk off the ship, and he like looks up to the window and like knocks on his helmet and like kind of shrugs, like, oh I don't know. And the guy's like, Oh, geez. So he tells the other one, he's like, Oh, we I think we have a ",
|
| 10 |
"adaln_summary": "(all zeros)",
|
| 11 |
"adaln_nonzero": 0
|
| 12 |
},
|
| 13 |
{
|
| 14 |
+
"step": 10000,
|
| 15 |
"mode": "procedural_prefix",
|
| 16 |
+
"caption": "A medium-quality recording of a male speaker discussing financial matters. The speaker sounds informative and slightly enthusiastic. The recording quality is decent, with no noticeable background noise.",
|
| 17 |
+
"prefix": "[evident buoyant excellent background quality undercurrent relaxed barely meditative humorous evident zeroed-in low-pitched notable curious decent speech quality expressive]",
|
| 18 |
+
"transcript": "The report says people use it when they need to, not just because it's popular. Also when global financial stress goes up, measured by things like the VIX, a market fear index, Bitcoin use also goes up. This shows that even investors and businesses use crypto more during uncertain times. Fascinating",
|
| 19 |
"adaln_summary": "(all zeros)",
|
| 20 |
"adaln_nonzero": 0
|
| 21 |
},
|
| 22 |
{
|
| 23 |
+
"step": 10000,
|
| 24 |
"mode": "procedural_prefix",
|
| 25 |
+
"caption": "A medium-quality recording of a female speaker narrating a story. The speaker sounds neutral and informative. The recording quality is decent, and there is no background noise.",
|
| 26 |
+
"prefix": "[ghost tranquil, evident attentive, vivid interested, excellent background quality, humorous, trace pining, decent speech quality, flicker cherishing, hesitant, high arousal]",
|
| 27 |
+
"transcript": "",
|
| 28 |
"adaln_summary": "(all zeros)",
|
| 29 |
"adaln_nonzero": 0
|
| 30 |
},
|
| 31 |
{
|
| 32 |
+
"step": 10000,
|
| 33 |
"mode": "static_caption",
|
| 34 |
+
"caption": "A medium-quality recording of a male speaker discussing music and art. The speaker sounds thoughtful and analytical, with a slightly conversational tone. There are no sound effects or music.",
|
| 35 |
+
"prefix": "[The speaker sounds thoughtful and analytical, with a slightly conversational tone. A medium-quality recording of a male speaker discussing music and art. There are no sound effects or music]",
|
| 36 |
+
"transcript": "Gosh. He's he's drum. No, he hangs out with this musician, and and this I think we're supposed to get from this that Lestat does have another side to him, that he's got like a kind of a patron for the arts sort of thing going on. And in other adaptations, this is really important because Lestat is k",
|
| 37 |
"adaln_summary": "(all zeros)",
|
| 38 |
"adaln_nonzero": 0
|
| 39 |
},
|
| 40 |
{
|
| 41 |
+
"step": 10000,
|
| 42 |
"mode": "static_caption",
|
| 43 |
+
"caption": "A high-quality recording of a female speaker talking in a conversational tone. She sounds slightly enthusiastic and is explaining something. There are no sound effects or music.",
|
| 44 |
+
"prefix": "[A high-quality recording of a female speaker talking in a conversational tone. She sounds slightly enthusiastic and is explaining something. There are no sound effects or music]",
|
| 45 |
+
"transcript": "that magically as well. Yes. Definitely time blocking. So it's like saying it is okay because I've scheduled it. But what it also means is I've scheduled time to work as well. Don't worry, I'm not just flowing all day every day. I got other chunks of time where I'm working intentionally. And so then",
|
| 46 |
"adaln_summary": "(all zeros)",
|
| 47 |
"adaln_nonzero": 0
|
| 48 |
},
|
| 49 |
{
|
| 50 |
+
"step": 10000,
|
| 51 |
"mode": "static_caption",
|
| 52 |
+
"caption": "A high-quality recording of a male speaker discussing a topic with a thoughtful and slightly analytical tone. The speaker sounds engaged and articulate. There are no sound effects or music.",
|
| 53 |
+
"prefix": "[There are no sound effects or music. A high-quality recording of a male speaker discussing a topic with a thoughtful and slightly analytical tone. The speaker sounds engaged and articulate]",
|
| 54 |
+
"transcript": "Yeah, that that's so well said, you know, tying it back to the infrared that we discussed earlier, you know, if you go experience an infrared somewhere for 45 minutes, and then you compare that to what you just described, your senses are engaged in so many ways, you know, the sausage, the beer, the ",
|
| 55 |
"adaln_summary": "(all zeros)",
|
| 56 |
"adaln_nonzero": 0
|
| 57 |
},
|
| 58 |
{
|
| 59 |
+
"step": 10000,
|
| 60 |
"mode": "adaln_only",
|
| 61 |
+
"caption": "A medium-quality recording of a male speaker discussing a local party. He sounds somewhat cynical and matter-of-fact, with a slightly frustrated tone. The recording quality is decent, with no noticeable background noise.",
|
| 62 |
"prefix": "",
|
| 63 |
+
"transcript": "You just go down to the snow castle, party, drink, have fun inside a snow castle on Great Slave Lake. People DIYing everything. It's the only way you're gonna get shit ha shit up there and get things happening. You know, there's a it used to be pretty transient. I know this is getting rambling now. ",
|
| 64 |
+
"adaln_summary": "Amusement=0.10, Elation=0.32, Pleasure_Ecstasy=0.39, Thankfulness_Gratitude=0.06, Infatuation=-0.04, Hope_Enthusiasm_Optimism=0.81, Pride=0.50, Interest=2.61, Awe=-0.01, Astonishment_Surprise=1.04, Concentration=1.36, Contemplation=0.80, Relief=0.01, Longing=0.01, Teasing=0.35",
|
| 65 |
+
"adaln_nonzero": 47
|
| 66 |
},
|
| 67 |
{
|
| 68 |
+
"step": 10000,
|
| 69 |
"mode": "adaln_only",
|
| 70 |
+
"caption": "A medium-quality recording of a male speaker discussing a sports game. He sounds analytical and slightly frustrated. The audio quality is decent, with no noticeable background noise.",
|
| 71 |
"prefix": "",
|
| 72 |
+
"transcript": "",
|
| 73 |
+
"adaln_summary": "Elation=0.01, Thankfulness_Gratitude=0.04, Infatuation=-0.01, Triumph=0.75, Pride=0.51, Interest=2.62, Astonishment_Surprise=0.08, Concentration=1.70, Contemplation=0.62, Relief=0.07, Longing=-0.02, Teasing=0.51, Impatience_and_Irritability=1.46, Sexual_Lust=-0.05, Doubt=0.06",
|
| 74 |
+
"adaln_nonzero": 48
|
| 75 |
},
|
| 76 |
{
|
| 77 |
+
"step": 10000,
|
| 78 |
"mode": "adaln_only",
|
| 79 |
+
"caption": "A high-quality recording of a conversation between two people, a man and a woman. The woman sounds slightly concerned and the man sounds appreciative. The recording quality is very good, and there is no background noise.",
|
| 80 |
"prefix": "",
|
| 81 |
+
"transcript": "Yeah. Thank you. It's uh I I I I appreciate all of these answers, especially since these are difficult and very, very annoying questions that that we shouldn't have to address but do. So to all the haters, happy pride. Um I wanna I wanna end, you know, on a on a positive note.",
|
| 82 |
+
"adaln_summary": "Amusement=0.23, Elation=0.92, Pleasure_Ecstasy=0.65, Contentment=1.26, Thankfulness_Gratitude=1.67, Affection=0.91, Infatuation=-0.04, Hope_Enthusiasm_Optimism=1.59, Triumph=0.07, Pride=0.82, Interest=2.28, Concentration=1.55, Contemplation=0.84, Relief=1.05, Longing=-0.01",
|
| 83 |
+
"adaln_nonzero": 40
|
| 84 |
},
|
| 85 |
{
|
| 86 |
+
"step": 10000,
|
| 87 |
"mode": "baseline",
|
| 88 |
+
"caption": "A high-quality recording of a male speaker giving a presentation or speech. He sounds informative and slightly enthusiastic. The audio quality is very good, and there is no background noise.",
|
| 89 |
"prefix": "",
|
| 90 |
+
"transcript": "Creating attention through giveaway posts has helped us gain followers. I talk to my customers about what we do and sell. And that also seems to help us gain followers and buyers, said Costa. Nestled against the French Creek countryside of Chester County. Woodland Jewel is an artisanal mushroom farm",
|
| 91 |
"adaln_summary": "(all zeros)",
|
| 92 |
"adaln_nonzero": 0
|
| 93 |
},
|
| 94 |
{
|
| 95 |
+
"step": 10000,
|
| 96 |
"mode": "baseline",
|
| 97 |
+
"caption": "A medium-quality recording of a male speaker talking in a conversational tone. He sounds thoughtful and slightly enthusiastic. The recording quality is decent, and there is no noticeable background noise.",
|
| 98 |
"prefix": "",
|
| 99 |
+
"transcript": "identical, but similar to it. I love my church and I I love the people that are there. And I I'm getting to know folks. And so I I'm just trying to assimilate and get to know people there and the leadership and all the things that we're doing. But I would agree. I think one of the the big things tha",
|
| 100 |
"adaln_summary": "(all zeros)",
|
| 101 |
"adaln_nonzero": 0
|
| 102 |
},
|
| 103 |
{
|
| 104 |
+
"step": 10000,
|
| 105 |
"mode": "baseline",
|
| 106 |
+
"caption": "A high-quality recording of a podcast outro. The speaker is a female, and she sounds friendly and enthusiastic. The audio quality is very good, and there is no background noise.",
|
| 107 |
"prefix": "",
|
| 108 |
+
"transcript": "Marker. Okay. We'll be back next Wednesday, you guys. Thank you so much for listening to the Pivot Podcast. You can rate review and subscribe wherever you get your podcast. Follow along on Instagram at the pivot pod. We love a poll, so please participate in our polls because mostly they're just Nata",
|
| 109 |
"adaln_summary": "(all zeros)",
|
| 110 |
"adaln_nonzero": 0
|
| 111 |
},
|
| 112 |
{
|
| 113 |
+
"step": 10000,
|
| 114 |
"mode": "dual",
|
| 115 |
+
"caption": "A high-quality recording of a male speaker discussing a topic with a thoughtful and slightly frustrated tone. He sounds articulate and passionate about the subject. There are no sound effects or music.",
|
| 116 |
+
"prefix": "[mild upbeat substantial keen palpable derisive hesitant soft musing soft voice decent speech quality measured intent]",
|
| 117 |
+
"transcript": "Yeah, now that sounds great. I'm I I've always struggled to understand why you have to put the the words non-racialism and non-sexism in a document. It's it should be self-evident. I mean it's like in going to a party and introducing yourself as I'm Donald Brown, I'm not a sexist, I'm not a racist. ",
|
| 118 |
+
"adaln_summary": "Elation=0.04, Contentment=0.94, Thankfulness_Gratitude=0.67, Infatuation=-0.02, Hope_Enthusiasm_Optimism=1.37, Pride=0.53, Interest=2.35, Astonishment_Surprise=0.01, Concentration=1.96, Contemplation=1.46, Relief=0.01, Longing=-0.02, Impatience_and_Irritability=0.90, Sexual_Lust=0.03, Doubt=0.58",
|
| 119 |
+
"adaln_nonzero": 43
|
| 120 |
},
|
| 121 |
{
|
| 122 |
+
"step": 10000,
|
| 123 |
"mode": "dual",
|
| 124 |
+
"caption": "A medium-quality recording of a male speaker discussing problems with a slightly frustrated tone. The speaker sounds somewhat serious and concerned. There are no sound effects or music.",
|
| 125 |
+
"prefix": "[subdued angry breath thoughtful calm focused warm fast speech slight tranquil notable engaged low-pitched excellent overall quality excellent content enjoyment excellent background quality soft voice]",
|
| 126 |
+
"transcript": "halt gro\u00dfe, massive Probleme brachte f\u00fcr Lebewesen, vor allem auf der S\u00fcdhalbkugel und auch f\u00fcr die Menschen auf der S\u00fcdhalbkugel und auch bis heute bringend im Norden \u00fcbrigens auch. Aber hier kann man halt sehen,",
|
| 127 |
+
"adaln_summary": "Elation=0.01, Contentment=0.78, Thankfulness_Gratitude=0.05, Infatuation=-0.02, Hope_Enthusiasm_Optimism=0.51, Pride=0.56, Interest=2.35, Concentration=1.86, Contemplation=0.87, Relief=0.04, Longing=-0.02, Impatience_and_Irritability=0.24, Sexual_Lust=-0.03, Fear=-0.02, Bitterness=0.01",
|
| 128 |
"adaln_nonzero": 38
|
| 129 |
},
|
| 130 |
{
|
| 131 |
+
"step": 10000,
|
| 132 |
"mode": "dual",
|
| 133 |
+
"caption": "A medium-quality recording of a female speaker discussing a topic with a slightly conversational tone. She sounds somewhat thoughtful and neutral in her emotional expression. The recording quality is decent, with no noticeable background noise.",
|
| 134 |
+
"prefix": "[cold, marked engaged, hesitant, mild excited, harsh voice, gentle warm-hearted, decent speech quality, discernible ecstatic, submissive, muted luxuriating]",
|
| 135 |
+
"transcript": "",
|
| 136 |
+
"adaln_summary": "Amusement=0.60, Elation=1.22, Pleasure_Ecstasy=1.00, Contentment=0.89, Thankfulness_Gratitude=0.12, Affection=1.07, Infatuation=0.03, Hope_Enthusiasm_Optimism=1.51, Triumph=-0.01, Pride=0.82, Interest=2.43, Concentration=0.78, Contemplation=0.65, Relief=0.37, Longing=0.07",
|
| 137 |
+
"adaln_nonzero": 39
|
| 138 |
}
|
| 139 |
]
|
| 140 |
}
|