clustex
Version:
Clustex is a lightweight text classification package designed to efficiently categorize text based on similarity metrics and learned token weights.
74 lines • 6.27 kB
JSON
{
"classifications": [
"spam",
"normal"
],
"data": [
{"text": "Вы выиграли миллион долларов! Получите его сейчас!", "classification": "spam"},
{"text": "Привет, как твои дела?", "classification": "normal"},
{"text": "Act fast! Limited-time offer on luxury watches!", "classification": "spam"},
{"text": "Hello, are you coming to the party tonight?", "classification": "normal"},
{"text": "¡Increíble descuento en productos electrónicos! Haz clic aquí.", "classification": "spam"},
{"text": "Hola, ¿quieres ir al cine este fin de semana?", "classification": "normal"},
{"text": "Gagnez de l'argent rapidement avec ce système magique!", "classification": "spam"},
{"text": "Salut! Tu veux prendre un café cet après-midi?", "classification": "normal"},
{"text": "限时优惠!点击这里获取您的奖金!", "classification": "spam"},
{"text": "你好!今天的天气真好!", "classification": "normal"},
{"text": "Jetzt sofort anmelden und kostenloses Geld erhalten!", "classification": "spam"},
{"text": "Hallo, hast du Lust auf ein Treffen morgen?", "classification": "normal"},
{"text": "Эксклюзивное предложение! Только сегодня получите приз!", "classification": "spam"},
{"text": "Как твои планы на выходные?", "classification": "normal"},
{"text": "Biggest sale of the year! Click to claim your reward!", "classification": "spam"},
{"text": "Would you like to grab lunch together?", "classification": "normal"},
{"text": "¡Hazte rico rápido con este sencillo truco!", "classification": "spam"},
{"text": "¿Quieres charlar un rato?", "classification": "normal"},
{"text": "Ajoutez votre numéro pour un accès spécial!", "classification": "spam"},
{"text": "J'adore les promenades en plein air!", "classification": "normal"},
{"text": "点击链接获取免费产品!", "classification": "spam"},
{"text": "我刚看完了一本书,太有趣了!", "classification": "normal"},
{"text": "Erhalten Sie sofortigen Zugang zu exklusiven Deals!", "classification": "spam"},
{"text": "Ich liebe es, neue Dinge zu lernen!", "classification": "normal"},
{"text": "Супер акция! Скидки до 90%, спешите!", "classification": "spam"},
{"text": "Сегодня был замечательный день!", "classification": "normal"},
{"text": "Claim your free iPhone now!", "classification": "spam"},
{"text": "I had a wonderful weekend!", "classification": "normal"},
{"text": "¡Recibe dinero por ver anuncios!", "classification": "spam"},
{"text": "Nos vemos mañana!", "classification": "normal"},
{"text": "Gagnez un voyage de luxe gratuitement!", "classification": "spam"},
{"text": "Profitez de cette belle journée!", "classification": "normal"},
{"text": "赢得免费比特币!", "classification": "spam"},
{"text": "我很期待周末!", "classification": "normal"},
{"text": "Exklusive Casino-Angebote nur für Sie!", "classification": "spam"},
{"text": "Ich habe eine neue Serie begonnen!", "classification": "normal"},
{"text": "Прямо сейчас получите деньги без вложений!", "classification": "spam"},
{"text": "Мне понравилось обсуждение сегодня!", "classification": "normal"},
{"text": "This is your last chance to claim rewards!", "classification": "spam"},
{"text": "Are you free for a call later?", "classification": "normal"},
{"text": "¡Grandes premios en efectivo te esperan!", "classification": "spam"},
{"text": "Disfruté la conversación contigo.", "classification": "normal"},
{"text": "Gagnez instantanément avec cette opportunité unique!", "classification": "spam"},
{"text": "J’ai découvert un nouveau café!", "classification": "normal"},
{"text": "点击这里获取独家优惠!", "classification": "spam"},
{"text": "我很喜欢这部电影!", "classification": "normal"},
{"text": "Jetzt anmelden und doppelten Gewinn erhalten!", "classification": "spam"},
{"text": "Ich genieße die frische Luft.", "classification": "normal"},
{"text": "Секретный метод получения богатства!", "classification": "spam"},
{"text": "Я люблю готовить новые блюда!", "classification": "normal"},
{"text": "Claim your cryptocurrency reward now!", "classification": "spam"},
{"text": "Let’s meet up tomorrow!", "classification": "normal"},
{"text": "Уникальная возможность увеличить доход!", "classification": "spam"},
{"text": "Прочитал интересную статью сегодня!", "classification": "normal"},
{"text": "Super discount! Limited-time offer!", "classification": "spam"},
{"text": "Would you like to go on a trip?", "classification": "normal"},
{"text": "¡Compra ahora y recibe un gran premio!", "classification": "spam"},
{"text": "Nos vemos en el café más tarde.", "classification": "normal"},
{"text": "Maximize your earnings with this secret method!", "classification": "spam"},
{"text": "I really enjoyed our discussion today.", "classification": "normal"},
{"text": "Gagnez un prix en vous inscrivant maintenant!", "classification": "spam"},
{"text": "J’ai découvert un restaurant incroyable!", "classification": "normal"},
{"text": "独家折扣,只限今天!", "classification": "spam"},
{"text": "我刚学会了一个新技能!", "classification": "normal"},
{"text": "Sichern Sie sich jetzt Ihr kostenloses Geschenk!", "classification": "spam"},
{"text": "Ich freue mich auf das Wochenende.", "classification": "normal"}
]
}