8:["$","div",null,{"className":"h-[calc(100vh-110px)] w-full pt-0 sm:h-auto","data-sentry-component":"Page","data-sentry-source-file":"page.tsx","children":["$","$L14",null,{"initialNeuron":{"modelId":"gpt-oss-20b","layer":"11-resid-post-aa","index":"74658","sourceSetName":"resid-post-aa","creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T04:31:51.554Z","maxActApprox":373.25,"hasVector":false,"vector":[],"vectorLabel":null,"vectorDefaultSteerStrength":10,"hookName":null,"topkCosSimIndices":[],"topkCosSimValues":[],"neuron_alignment_indices":[],"neuron_alignment_values":[],"neuron_alignment_l1":[],"correlated_neurons_indices":[],"correlated_neurons_pearson":[],"correlated_neurons_l1":[],"correlated_features_indices":[],"correlated_features_pearson":[],"correlated_features_l1":[],"neg_str":[" arr","(arr","_arr"," अर","\tarr","열","_feedback",".arr","Guests"," mengambil"],"neg_values":[-0.08526611328125,-0.07952880859375,-0.07952880859375,-0.0767822265625,-0.075927734375,-0.07464599609375,-0.07415771484375,-0.07391357421875,-0.07354736328125,-0.07177734375],"pos_str":[" Zugriff","中文版"," pretrained","ilingual"," NLP"," કરતાં"," prepor","ימון"," MODEL","ketøy"],"pos_values":[0.09136962890625,0.091064453125,0.08892822265625,0.08575439453125,0.0816650390625,0.079833984375,0.07879638671875,0.07867431640625,0.0777587890625,0.077392578125],"frac_nonzero":0.0000119620995504498,"freq_hist_data_bar_heights":[],"freq_hist_data_bar_values":[],"logits_hist_data_bar_heights":[],"logits_hist_data_bar_values":[],"decoder_weights_dist":[],"umap_cluster":null,"umap_log_feature_sparsity":null,"umap_x":null,"umap_y":null,"model":{"id":"gpt-oss-20b","displayNameShort":"GPT-OSS-20B","displayName":"GPT-OSS-20B","creatorId":"clkht01d40000jv08hvalcvly","tlensId":"openai/gpt-oss-20b","dimension":2880,"thinking":true,"visibility":"PUBLIC","defaultSourceSetName":null,"defaultSourceId":null,"defaultGraphSourceSetName":null,"inferenceEnabled":true,"instruct":true,"layers":24,"neuronsPerLayer":0,"createdAt":"$D2025-09-11T08:50:59.351Z","owner":"OpenAI","updatedAt":"$D2025-09-11T08:50:59.351Z","website":"https://huggingface.co/openai"},"lists":[],"creator":{"name":"bot-neuronpedia"},"source":{"id":"11-resid-post-aa","modelId":"gpt-oss-20b","hasDashboards":true,"inferenceEnabled":true,"saelensConfig":null,"saelensRelease":null,"saelensSaeId":null,"hfRepoId":"andyrdt/saes-gpt-oss-20b","hfFolderId":"resid_post_layer_11/trainer_0","visibility":"PUBLIC","defaultOfModelId":null,"setName":"resid-post-aa","creatorId":"clkht01d40000jv08hvalcvly","hasUmap":false,"hasUmapLogSparsity":false,"hasUmapClusters":false,"num_prompts":0,"num_tokens_in_prompt":1024,"dataset":"Various","notes":null,"cosSimMatchModelId":null,"cosSimMatchSourceId":null,"createdAt":"$D2025-09-11T08:50:59.351Z"},"sourceSet":{"modelId":"gpt-oss-20b","name":"resid-post-aa","hasDashboards":true,"allowInferenceSearch":true,"visibility":"PUBLIC","description":"Resid Post - 131k","type":"Resid Post - 131k","creatorName":"Andy Arditi","urls":["https://huggingface.co/andyrdt/saes-gpt-oss-20b"],"creatorEmail":null,"creatorId":"clkht01d40000jv08hvalcvly","releaseName":"gpt-oss-sae","hasGraphs":false,"graphEnabled":false,"similarityMatrixEnabled":false,"defaultOfModelId":null,"defaultGraphModelId":null,"defaultRange":1,"defaultShowBreaks":true,"showDfa":false,"showCorrelated":false,"showHeadAttribution":false,"showUmap":false,"createdAt":"$D2025-09-11T08:50:59.351Z"},"comments":[],"activations":[{"id":"kwz94oa4mn43l7zffu8exo6y","tokens":["<|start|>","system","<|message|>","You"," are"," Chat","GPT",","," a"," large"," language"," model"," trained"," by"," Open","AI",".\n","Knowledge"," cutoff",":"," ","202","4","-","06","\n","Current"," date",":"," ","202","5","-","09","-","18","\n\n","Reason","ing",":"," low","\n\n","#"," Valid"," channels",":"," analysis",","," commentary",","," final","."," Channel"," must"," be"," included"," for"," every"," message",".","<|end|>","<|start|>","user","<|message|>","Create"," a"," spam"," email"," detection"," model"," using"," Natural"," Language"," Processing"," techniques"," in"," Python",","," which"," should"," be"," able"," to"," identify"," and"," classify"," emails"," based"," on"," their"," text"," content"," as"," either"," spam"," or"," non","-sp","am"," with"," a"," high"," degree"," of"," accuracy","."," The"," model"," should"," utilize"," various"," NLP"," tools"," and"," techniques"," such"," as"," word"," embeddings",","," text"," preprocessing",","," and"," feature"," extraction",","," and"," should"," be"," trained"," on"," a"," large"," and"," diverse"," dataset"," of"," labeled"," spam"," and"," non","-sp","am"," emails","."," Additionally",","," the"," model"," should"," incorporate"," a"," range"," of"," evaluation"," metrics"," to"," measure"," its"," performance",","," including"," precision",","," recall",","," F","1","-score",","," and"," confusion"," matrix"," analysis","."," Finally",","," the"," model"," should"," be"," able"," to"," handle"," real","-world"," scenarios"," such"," as"," new"," and"," previously"," unseen"," types"," of"," spam"," emails",","," and"," should"," be"," designed"," to"," be"," scalable"," and"," maintain","able"," for"," future"," updates"," and"," improvements",".","<|end|>","<|start|>","assistant","<|channel|>","analysis","<|message|>","Need"," to"," provide"," a"," comprehensive"," guide"," with"," code",".","<|end|>","<|start|>","assistant","<|channel|>","final","<|message|>","##"," ","1","."," "," Overview","\n\n","Below"," you","’ll"," find"," a"," **","complete",","," end","‑","to","‑","end"," example","**"," that","\n\n","|"," Step"," |"," Description"," |\n","|","------","|","-------------","|\n","|"," **","Data","**"," |"," Download"," &"," combine"," the"," publicly","‑","available"," **","Spam","Ass","assin"," Public"," Corpus","**"," &"," a"," few"," non","‑","spam"," (","ham",")"," datasets","."," |\n","|"," **","Pre","‑","processing","**"," |"," Strip"," HTML",","," URLs",","," mentions",","," normalize"," case",","," remove"," stop","words",","," le","mmat","ise",","," etc","."," |\n","|"," **","Feature"," Engineer","**"," |"," ","1","️⃣"," TF","‑","ID","F"," +"," ","2","️⃣"," Ability"," to"," add"," word","‑","embedding"," vectors"," (","Fast","Text"," /"," G","lo","Ve"," or"," contextual"," *","B","ERT","*",")."," |\n","|"," **","Model","**"," |"," ","3","️⃣"," *","Hybrid","*"," model",":"," a"," **","text"," classification"," pipeline","**"," that"," can"," use"," any"," of"," the"," above"," features","."," Includes"," a"," logistic"," regression",","," X","G","Boost",","," and"," a"," transformer","‑","based"," fine","‑","t","uned"," *","Dist","il","B","ERT","*."," |\n","|"," **","Evaluation","**"," |"," Precision",","," Recall",","," F","1",","," Conf","usion"," matrix",","," ROC","‑","A","UC",","," PR","‑","A","UC","."," |\n","|"," **","Sc","al","ability","**"," |"," Uses"," **","p","andas","**,"," **","sc","ikit","‑","learn","**,"," **","H","ug","ging","Face"," Transformers","**,"," and"," **","ml","flow","**"," (","optional",")"," for"," reproduc","ibility","."," |\n","|"," **","Extend","ability","**"," |"," The"," script"," is"," modular",":"," you"," can"," plug"," in"," new"," embeddings",","," switch"," models",","," or"," retr","ain"," on"," fresh"," data"," with"," minimal"," code"," changes","."," |\n\n",">"," **","Note","**"," –"," Run"," the"," notebook"," in"," a"," GPU","‑","enabled"," environment"," (","Col","ab"," or"," a"," local"," machine",")"," if"," you"," plan"," to"," use"," transformer"," models","."," No"," GPU"," is"," required"," for"," the"," TF","‑","ID","F"," +"," X","G","Boost"," baseline",".\n\n","---\n\n","##"," ","2","."," "," Project"," Layout","\n\n","``","`\n","spam","_classifier","/\n","├","──"," data","/\n","│"," "," �","�","──"," spam","/\n","│"," "," �","�","──"," ham","/\n","│"," "," �","�","──"," raw","/"," "," #"," raw"," files"," downloaded"," here","\n","├","──"," models","/\n","│"," "," �","�","──"," saved","_models","/"," #"," pick","led"," models",","," embeddings",","," vector","izers","\n","├","──"," notebooks","/\n","│"," "," �","�","──"," spam","_classifier",".ip","yn","b","\n","├","──"," requirements",".txt","\n","�","�","──"," README",".md","\n","``","`\n\n","---\n\n","##"," ","3","."," "," Environment"," Setup"," (`","requirements",".txt","`",")\n\n","```","text","\n","p","andas","==","2",".","1",".","3","\n","numpy","==","1",".","26",".","4","\n","sc","ikit","-le","arn","==","1",".","4",".","1",".post","1","\n","x","g","boost","==","2",".","0",".","3","\n","n","ltk","==","3",".","8",".","1","\n","sp","acy","==","3",".","7",".","4","\n","beautiful","s","oup","4","==","4",".","12",".","3","\n","t","q","dm","==","4",".","66",".","2","\n","sentence","piece","==","0",".","1",".","99","\n","requests","==","2",".","31",".","0","\n","transform","ers","==","4",".","42",".","4","\n","torch","==","2",".","3",".","1","\n","datasets","==","2",".","20",".","0","\n","sc","ipy","==","1",".","13",".","1","\n","mat","plotlib","==","3",".","8",".","4","\n","se","ab","orn","==","0",".","13",".","2","\n","ml","flow","==","2",".","11",".","1"," "," #"," optional"," –"," for"," experiment"," tracking","\n","``","`\n\n","```","bash","\n","pip"," install"," -","r"," requirements",".txt","\n","python"," -","m"," sp","acy"," download"," en","_core","_web","_sm","\n","``","`\n\n","---\n\n","##"," ","4","."," "," Download"," &"," Prepare"," the"," Dataset","\n\n","###"," ","4",".","1"," "," Spam","Ass","assin"," Public"," Corpus"," "," (","spam"," emails",")\n\n","```","python","\n","import"," os",","," requests",","," tar","file",","," tqdm","\n\n","DATA","_DIR"," ="," \"","data","/raw","\"\n","os",".makedirs","(DATA","_DIR",","," exist","_ok","=True",")\n\n","spam","_url"," ="," \"","https","://","spam","ass","assin",".apache",".org","/","old","/public","cor","pus","/","200","302","28",".t","gz","\"\n","spam","_file"," ="," os",".path",".join","(DATA","_DIR",","," \"","200","302","28",".t","gz","\")\n\n","if"," not"," os",".path",".exists","(sp","am","_file","):\n"," "," print","(\"","Downloading"," spam"," corpus","...\")\n"," "," resp"," ="," requests",".get","(sp"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Chat","maxValue":373.25,"maxValueTokenIndex":861,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,23.5,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,32.8125,139.5,63.40625,54.8125,89.875,0,50.375,0,23.3125,68.0625,332.5,130.875,107.125,148.875,0,132.25,0,63.125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,161,371,266.75,144.375,373.25,237.75,260.5,107.6875,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,90.6875,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"ayo3js9cqbdkpwiqw28gbd4w","tokens":["<|start|>","system","<|message|>","You"," are"," Chat","GPT",","," a"," large"," language"," model"," trained"," by"," Open","AI",".\n","Knowledge"," cutoff",":"," ","202","4","-","06","\n","Current"," date",":"," ","202","5","-","09","-","18","\n\n","Reason","ing",":"," medium","\n\n","#"," Valid"," channels",":"," analysis",","," commentary",","," final","."," Channel"," must"," be"," included"," for"," every"," message",".","<|end|>","<|start|>","user","<|message|>","Write"," a"," Python"," script"," that"," uses"," Natural"," Language"," Processing"," techniques"," to"," analyze"," the"," sentiment"," (","positive",","," negative"," or"," neutral",")"," of"," comments"," posted"," on"," a"," specified"," You","Tube"," video","."," The"," script"," must"," be"," able"," to"," handle"," large"," volumes"," of"," comments",","," and"," accurately"," classify"," the"," sentiment"," of"," each"," comment"," based"," on"," factors"," such"," as"," the"," tone",","," emotion",","," and"," language"," used"," in"," the"," comments","."," Additionally",","," the"," script"," should"," be"," able"," to"," generate"," meaningful"," insights"," from"," the"," sentiment"," analysis",","," such"," as"," identifying"," common"," topics"," or"," themes"," that"," el","icit"," strong"," positive"," or"," negative"," reactions"," from"," viewers",".","<|end|>","<|start|>","assistant","<|channel|>","analysis","<|message|>","We"," need"," to"," produce"," a"," Python"," script"," that"," uses"," NLP"," techniques"," to"," analyze"," sentiment"," of"," You","Tube"," comments","."," Should"," handle"," large"," volumes",","," classify"," sentiment",","," extract"," insights",","," topics","."," Provide"," code",":"," fetching"," comments"," via"," You","Tube"," API",","," using"," sentiment"," analysis"," library"," (","like"," transformers",","," or"," Text","Blob",","," V","ADER",","," or"," N","LT","K",")."," For"," large"," volumes",","," we"," might"," use"," async"," or"," chunk","ing",","," maybe"," store"," results"," in"," Data","Frame",","," concurrency",".\n\n","The"," script"," also"," should"," identify"," common"," topics"," or"," themes"," that"," el","icit"," strong"," reactions",":"," could"," use"," L","DA"," topic"," modeling"," or"," bert"," embeddings"," clustering","."," Use"," spa","Cy"," for"," NLP",","," sc","ikit","-le","arn"," for"," L","DA",","," or"," use"," sentence","-transform","ers"," +"," clustering",".\n\n","We"," need"," to"," show"," how"," to"," accept"," video"," ID",","," fetch"," comments"," (","with"," Google"," API"," key",")."," Use"," youtube","-data","-api"," docs",".\n\n","Sent","iment"," classification",":"," For"," more"," accuracy",","," use"," transformers"," pipeline"," from"," hugging","face"," (","l","abeled",")."," Use"," \"","facebook","/b","art","-large","-m","n","li","\""," for"," sentiment"," analysis"," or"," \"","dist","il","bert","-base","-","unc","ased","-f","inet","uned","-s","st","-","2","-","english","\"."," For"," speed"," with"," many"," comments",","," can"," do"," batch"," inference",".\n\n","We"," should"," also"," highlight"," handling"," large"," volumes",":"," use"," batching",","," multiprocessing",","," or"," streaming",".\n\n","Also",","," for"," insights",":"," compute"," average"," sentiment",","," counts",","," identify"," topics"," using"," L","DA"," but"," label"," with"," sentiments",".\n\n","Provide"," full"," script"," with"," dependencies"," and"," instructions",".\n\n","The"," script"," should"," be"," modular",":"," functions"," for"," fetching"," comments",","," cleaning"," text",","," sentiment"," analysis",","," topic"," modeling",","," results",".\n\n","Also",","," potential"," issues",":"," You","Tube"," API"," quota","."," Use"," pagination",".\n\n","Also"," multi","-thread",".\n\n","Ok"," produce"," final"," answer"," with"," explanation"," then"," code",".\n\n","Let's"," draft"," script",".\n\n","We"," can"," use"," pandas",","," numpy",","," google","-api","-python","-client",","," tqdm",","," sentence","_transform","ers",","," sklearn",","," sp","acy",","," etc",".\n\n","We'll"," pip"," install"," the"," libs",".\n\n","Provide"," a"," main"," function",","," accept"," video"," ID"," and"," optional"," environment"," variables"," for"," API"," key",".\n\n","Let's"," include"," inference"," caching",".\n\n","Also"," mention"," GPU"," usage",":"," not"," necessary",".\n\n","Ok"," produce",".","<|end|>","<|start|>","assistant","<|channel|>","final","<|message|>","Below"," is"," a"," **","stand","‑","alone"," Python"," script","**"," that"," is"," ready"," to"," be"," dropped"," into"," a"," virtual"," environment",","," run"," on"," a"," laptop"," or"," a"," server",","," and"," will"," do"," the"," following",":\n\n","1","."," **","Pull"," all"," comments","**"," from"," a"," You","Tube"," video"," (","using"," the"," official"," You","Tube","‑","Data","‑","API"," V","3",")."," \n","2","."," **","Class","ify"," each"," comment","**"," as"," *","Positive","*,"," *","Negative","*"," or"," *","Neutral","*"," –"," we"," use"," the"," Hug","ging","‑","Face"," `","transform","ers","`"," pipeline"," that"," comes"," pre","‑","trained"," on"," the"," SST","‑","2"," dataset"," (","very"," fast"," and"," highly"," accurate"," for"," English",")."," \n","3","."," **","Summ","ar","ise"," the"," overall"," sentiment","**"," of"," the"," whole"," comment"," feed","."," \n","4","."," **","Extract"," “","strong","”"," reactions","**"," –"," comments"," that"," scored"," >"," ±","0",".","7"," in"," confidence"," –"," and"," run"," an"," uns","uper","vised"," topic"," model"," (","Lat","ent"," Dir","ich","let"," Allocation",")"," on"," them"," to"," discover"," what"," viewers"," are"," actually"," talking"," about","."," \n","5","."," **","Write"," a"," tidy"," CSV","**"," that"," contains"," every"," comment"," +"," its"," sentiment"," +"," confidence"," +"," topic"," label",","," plus"," a"," short"," MD","‑","style"," “","Insights","”"," file"," (`","ins","ights",".md","`)"," with"," human","‑","read","able"," results",".\n\n","---\n\n","##"," Why"," does"," this"," script"," work"," well"," on"," *","large","*"," volumes","?\n\n","|"," Feature"," |"," How"," it"," helps"," |\n","|","---------","|","--------------","|\n","|","**","Pagination","**"," |"," The"," API"," returns"," ","100"," comments"," at"," a"," time"," (","maximum",")."," The"," `","list","_comments","`"," generator"," keeps"," pulling"," pages"," until"," exhaustion","."," |\n","|","**","Batch"," inference","**"," |"," The"," `","transform","ers","`"," sentiment"," analyzer"," accepts"," a"," list"," of"," texts"," –"," we"," process"," ","32","‑","comment"," batches"," to"," fully"," utilise"," the"," GPU","/","CPU"," and"," keep"," memory"," usage"," modest","."," |\n","|","**","Streaming"," writing","**"," |"," Every"," batch"," is"," appended"," to"," the"," same"," Data","Frame"," and"," flushed"," to"," disk"," once"," a"," million"," comments"," are"," finished"," –"," keeps"," RAM"," small","."," |\n","|","**","Optional"," multiprocessing","**"," |"," The"," script"," is"," written"," so"," that"," you"," could"," swap"," the"," simple"," for","‑","loop"," call"," for"," `","con","current",".f","utures",".Process","Pool","Executor","`"," without"," changing"," any"," other"," logic","."," |\n","|","**","Rate","‑","limit"," safe","**"," |"," A"," tiny"," `","time",".sleep","(","0",".","05",")`"," keeps"," us"," within"," your"," per","‑","second"," quota",";"," just"," tweak"," if"," you"," hit"," errors","."," |\n\n","---\n\n","##"," Dependencies","\n\n","```","bash","\n","pip"," install"," google","-api","-python","-client"," tqdm"," transformers"," torch"," pandas"," sc","ikit","-le","arn"," sentence","-transform","ers"," sp","acy","\n","python"," -","m"," sp","acy"," download"," en","_core","_web","_sm","\n","``","`\n\n",">"," **","Tip","**"," ",":"," if"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Chat","maxValue":372.25,"maxValueTokenIndex":1011,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,60.34375,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,47.53125,200.75,46.6875,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,43.6875,0,0,0,0,0,0,0,0,0,0,0,0,90.0625,0,0,26.78125,0,0,0,0,0,28.0625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,48.25,271,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,32.375,0,0,0,0,0,0,0,0,0,0,0,0,45.46875,284.5,0,0,0,31.5,114.4375,371,263.75,154,372.25,167.375,274.75,96.1875,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"wz4f3rssyoyf6rc15y2q2rrx","tokens":["<|start|>","system","<|message|>","You"," are"," Chat","GPT",","," a"," large"," language"," model"," trained"," by"," Open","AI",".\n","Knowledge"," cutoff",":"," ","202","4","-","06","\n","Current"," date",":"," ","202","5","-","09","-","18","\n\n","Reason","ing",":"," low","\n\n","#"," Valid"," channels",":"," analysis",","," commentary",","," final","."," Channel"," must"," be"," included"," for"," every"," message",".","<|end|>","<|start|>","user","<|message|>","Use"," English"," Spa","Cy"," lib",","," find"," all"," tokens"," with"," only"," digits"," and"," all"," proper"," nouns"," (","PRO","PN",","," aka",","," personal"," nouns"," )"," in"," the"," text",","," count"," it"," and"," output"," it"," right","-al","igned"," in"," the"," HTML",".\n","For"," example",","," for"," the"," text"," \"","we"," need"," ","2"," tickets"," to"," Dublin",","," and"," ","1","/","2"," a"," spoon"," of"," milk","\""," read"," from"," the"," stdin"," (","use"," python"," my","program",".py"," <"," input",".txt"," >","output",".html"," )"," the"," program"," should"," output"," that"," \"","2","\""," was"," found"," twice"," (","output"," \"","2","\"),"," \"","1","\""," was"," found"," once"," (","output"," \"","1","\"),"," \"","D","ublin","\""," was"," found"," once"," (","output"," \"","1","\").","<|end|>","<|start|>","assistant","<|channel|>","analysis","<|message|>","Need"," to"," provide"," Python"," code"," explanation",".","<|end|>","<|start|>","assistant","<|channel|>","final","<|message|>","Below"," is"," a"," complete",","," ready","‑","to","‑","run"," Python"," script"," that"," does"," exactly"," what"," you"," described",".\n\n","```","python","\n","#!/","usr","/bin","/env"," python","3","\n","\"\"\"\n","my","program",".py","\n\n","Usage",":\n"," "," python"," my","program",".py"," <"," input",".txt"," >"," output",".html","\n\n","The"," script"," reads"," plain","‑","text"," from"," standard"," input",","," token","ises"," the"," text"," with"," Spa","Cy",",\n","counts",":\n\n","*"," every"," token"," that"," consists"," only"," of"," digits"," ("," e",".g","."," “","2","”,"," “","123","”,"," “","001","”"," )\n","*"," every"," token"," that"," is"," tagged"," as"," a"," *","proper"," noun","*"," (","PRO","PN",")\n\n","The"," results"," are"," printed"," as"," a"," minimal",","," right","‑","aligned"," HTML"," fragment",".\n\n","Dependencies","\n","------------\n","*"," spa","Cy"," ","3",".x","\n","*"," en","_core","_web","_sm"," (","or"," any"," other"," Spa","Cy"," English"," model"," that"," contains"," the","\n"," "," '","tag","ger","'"," component"," and"," can"," produce"," the"," UP","OS"," tags",")\n\n","Install"," them"," with",":\n"," "," pip"," install"," sp","acy","\n"," "," python"," -","m"," sp","acy"," download"," en","_core","_web","_sm","\n","\"\"\"\n\n","import"," sys","\n","import"," collections","\n","import"," sp","acy","\n\n","def"," main","():\n"," "," #"," Load"," the"," smallest"," English"," model"," (","change"," if"," you"," want"," a"," larger"," one",")\n"," "," n","lp"," ="," sp","acy",".load","(\"","en","_core","_web","_sm","\")\n\n"," "," #"," Read"," the"," whole"," input","\n"," "," text"," ="," sys",".stdin",".read","()\n\n"," "," #"," Process"," with"," Spa","Cy","\n"," "," doc"," ="," n","lp","(text",")\n\n"," "," #"," Coun","ters","\n"," "," digits"," ="," collections",".Counter","()\n"," "," prop","n"," ="," collections",".Counter","()\n\n"," "," for"," token"," in"," doc",":\n"," "," #"," Ignore"," tokens"," that"," are"," purely"," whitespace"," or"," punctuation","\n"," "," if"," token",".is","_space"," or"," token",".is","_p","unct",":\n"," "," continue","\n\n"," "," #"," -----"," ","1","."," only"," digits"," ----","-\n"," "," if"," token",".text",".is","digit","():"," "," #"," token"," contains"," *","only","*"," digits","\n"," "," digits","[token",".text","]"," +="," ","1","\n\n"," "," #"," -----"," ","2","."," proper"," noun"," ----","-\n"," "," #"," token",".tag","_"," contains"," the"," Universal"," POS"," tag"," (","UP","OS",")\n"," "," if"," token",".tag","_"," =="," \"","PRO","PN","\":\n"," "," prop","n","[token",".text","]"," +="," ","1","\n\n"," "," #"," --------"," Build"," HTML"," --------","\n"," "," html"," ="," []\n"," "," html",".append","(\"<","!","DOCTYPE"," html","><","html","><","head",">\")\n"," "," html",".append","(\"<","meta"," charset","='","utf","-","8","'>","\")\n"," "," html",".append","(\"<","style",">\")\n"," "," html",".append","(\""," "," body"," {","font","-family",":"," monos","pace",";"," white","-space",":"," pre",";","}\")\n"," "," html",".append","(\""," "," .","right"," {","text","-align",":right",";","}\")\n"," "," html",".append","(\"\")\n"," "," html",".append","(\"<","body",">","\")\n\n"," "," #"," Helper",":"," format"," one"," category","\n"," "," def"," format","_block","(title",","," counter","):\n"," "," html",".append","(f","\"<","h","2",">{","title","}\")\n"," "," if"," not"," counter",":\n"," "," html",".append","(\"<","p",">No"," matches"," found",".\")\n"," "," return","\n"," "," for"," token",","," count"," in"," sorted","(counter",".items","()):\n"," "," html",".append","(f","\"<","p"," class","='","right","'>{","token","}:"," {","count","}","\")\n\n"," "," format","_block","(\"","Digits"," only","\","," digits",")\n"," "," format","_block","(\"","Proper"," nouns"," (","PRO","PN",")\","," prop","n",")\n\n"," "," html",".append","(\"","\")\n\n"," "," sys",".stdout",".write","(\"\\","n","\".","join","(html","))\n\n","if"," __","name","__"," =="," \"__","main","__\":\n"," "," main","()\n","``","`\n\n","###"," How"," it"," works","\n\n","|"," Step"," |"," What"," happens"," |"," Key"," code"," |\n","|","------","|","--------------","|","----------","|\n","|"," **","Read"," input","**"," |"," The"," script"," reads"," all"," text"," from"," `","stdin","`."," |"," `","text"," ="," sys",".stdin",".read","()`"," |\n","|"," **","Token","ise"," with"," Spa","Cy","**"," |"," `","nl","p"," ="," sp","acy",".load","(...",");"," doc"," ="," n","lp","(text",")`"," |"," `","nl","p","`"," provides"," `","Token",".is","digit","`,"," `","Token",".tag","_","`,"," etc","."," |\n","|"," **","Count"," tokens","**"," |"," Two"," `","Counter","`"," objects"," are"," updated",":"," one"," for"," digit","‑","only"," tokens",","," one"," for"," `","PRO","PN","`."," |"," ```","python","\n","if"," token",".text",".is","digit","():\n"," "," digits","[token",".text","]"," +="," ","1","\n","if"," token",".tag","_"," =="," \"","PRO","PN","\":\n"," "," prop","n","[token",".text","]"," +="," ","1","```"," |\n","|"," **","Build"," right","‑"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Chat","maxValue":367.75,"maxValueTokenIndex":337,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,163.5,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,44.34375,0,0,0,0,0,0,0,0,0,0,0,106.0625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,42.53125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,97.0625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,30.71875,0,0,82,100.875,272,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,45.53125,99.25,303.25,62.09375,66,0,0,0,212.375,367.75,289,274.5,161.25,109.25,125.8125,121.4375,36.96875,263.5,149.625,233.625,104.6875,80.1875,55,0,37.96875,130.75,0,73.875,86.8125,75.75,61.0625,69,33.46875,0,0,0,0,0,0,57.59375,0,0,0,0,0,95.8125,259,0,84.25,0,0,51.28125,0,291.25,207.625,150,189.375,0,210.5,0,0,0,0,0,0,0,0,0,48.84375,234.25,39.09375,0,0,0,0,28.515625,151.5,200.25,128.375,125.125,262.25,98.0625,27.5,56.9375,71.625,30.546875,118.875,80.75,87.25,29.328125,114.625,0,145.375,55.375,0,126.875,227.75,158.25,0,0,0,188.875,52.90625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,95.75,83,0,120.0625,0,67.125,0,0,0,115.8125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,31.515625,0,0,0,0,0,0,0,0,0,0,126.9375,0,0,0,0,115.375,0,0,135.125,135,30.296875,0,0,0,0,78.1875,0,0,0,0,0,75.3125,0,43.59375,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,39.5,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"sridaevfz8beqpl6mnub3s6j","tokens":["<|start|>","system","<|message|>","You"," are"," Chat","GPT",","," a"," large"," language"," model"," trained"," by"," Open","AI",".\n","Knowledge"," cutoff",":"," ","202","4","-","06","\n","Current"," date",":"," ","202","5","-","09","-","18","\n\n","Reason","ing",":"," medium","\n\n","#"," Valid"," channels",":"," analysis",","," commentary",","," final","."," Channel"," must"," be"," included"," for"," every"," message",".","<|end|>","<|start|>","user","<|message|>","Build"," a"," chatbot"," using"," Python"," and"," Natural"," Language"," Processing"," that"," can"," interact"," with"," users"," and"," provide"," helpful"," responses"," based"," on"," their"," input","."," The"," chatbot"," should"," be"," able"," to"," handle"," a"," wide"," range"," of"," topics"," and"," respond"," in"," a"," conversational"," and"," friendly"," tone","."," Consider"," implementing"," features"," such"," as"," sentiment"," analysis",","," keyword"," extraction",","," and"," context"," awareness"," to"," enhance"," the"," chatbot","'s"," abilities","."," The"," chatbot"," should"," also"," be"," able"," to"," respond"," appropriately"," to"," different"," levels"," of"," form","ality"," and"," adjust"," its"," language"," accordingly","."," Additionally",","," it"," should"," have"," error"," handling"," capabilities"," to"," gracefully"," handle"," unexpected"," input",".","<|end|>","<|start|>","assistant","<|channel|>","analysis","<|message|>","The"," user"," wants"," a"," comprehensive"," guide"," to"," build"," a"," chatbot"," in"," Python"," with"," NLP"," features",":"," conversation",","," sentiment"," analysis",","," keyword"," extraction",","," context"," awareness",","," handling"," form","ality"," levels",","," error"," handling","."," Provide"," code"," skeleton",","," explain"," libraries",","," structure","."," Maybe"," propose"," using"," open","-source"," libraries"," like"," spa","Cy",","," N","LT","K",","," transformers",","," text","blob",","," flair",","," or"," building"," on"," python","'s"," R","asa"," or"," hugging","face"," pipelines","."," Provide"," implementation"," steps",":"," data"," preparation",","," features",","," model"," selection",","," conversation"," flow",","," context"," management",","," response"," generation"," (","template"," or"," language"," model",","," e",".g",".,"," GPT","-","4"," via"," API"," or"," open","-source",")."," Provide"," sample"," code",":"," chatbot"," class",","," talk"," loop",","," sentiment"," analysis"," using"," Text","Blob"," or"," Vader",","," keyword"," extraction"," via"," RA","KE"," or"," spa","Cy","."," Adjust"," form","ality",":"," detect"," user"," style"," (","form","ality",")"," with"," a"," classifier"," or"," rule","-based",","," and"," choose"," response"," form","ality","."," Error"," handling",":"," try","-ex","cept",","," fallback"," responses",".\n\n","Should"," also"," mention"," usage"," of"," a"," knowledge"," base"," or"," retrieval","-based","."," Provide"," end","-to","-end"," example",".\n\n","Let's"," produce"," a"," long"," answer"," with"," sections"," and"," code",".","<|end|>","<|start|>","assistant","<|channel|>","final","<|message|>","##"," �","�"," Welcome"," to"," the"," “","Smart","‑","Chat","”"," Project","!\n\n","Below"," is"," a"," **","complete",","," end","‑","to","‑","end"," recipe","**"," for"," a"," Python"," chatbot"," that",":\n\n","|"," Feature"," |"," Implementation"," |\n","|","---","|","---","|\n","|"," **","Convers","ational"," &"," friendly"," tone","**"," |"," Mix"," of"," template"," &"," GPT","‑","style"," generation","."," |\n","|"," **","Sent","iment"," Analysis","**"," |"," [","V","ADER","](","https","://","github",".com","/c","jh","utto","/v","ader","Sent","iment",")"," (","fast",","," lex","icon","‑","based",")."," |\n","|"," **","Keyword"," Extraction","**"," |"," spa","Cy"," +"," RA","KE"," or"," the"," built","‑","in"," **","Key","B","ERT","**"," if"," you"," prefer"," B","ERT","‑","based","."," |\n","|"," **","Context"," Awareness","**"," |"," ","1","‑","turn"," or"," multi","‑","turn"," context"," stored"," in"," a"," small"," in","‑","memory"," U","DD","I","."," |\n","|"," **","Form","ality"," Adjustment","**"," |"," He","uristic"," +"," optional"," tiny"," classifier"," to"," toggle"," Pol","ite"," /"," Casual","."," |\n","|"," **","Error"," Handling","**"," |"," `","try","/","except","`,"," fall","backs",","," explicit"," “","I"," didn","’t"," understand","”"," prompt","."," |\n","|"," **","Ext","ens","ibility","**"," |"," Plug","‑","in"," slots"," for"," new"," intent"," detectors"," or"," retrieval"," engines","."," |\n\n",">"," **","Pro"," tip",":**"," For"," production","‑","grade"," bots"," you"," might"," want"," to"," wrap"," the"," entire"," flow"," in"," **","R","asa","**"," or"," **","Microsoft"," Bot"," Framework","**,"," but"," the"," skeleton"," below"," runs"," as"," a"," single"," script"," (","though"," feel"," free"," to"," split"," into"," modules",").\n\n","---\n\n","##"," �","�"," Dependencies","\n\n","```","bash","\n","pip"," install"," \\\n"," "," sp","acy"," \\\n"," "," nltk"," \\\n"," "," text","blob"," \\\n"," "," vader","Sent","iment"," \\\n"," "," transformers"," \\\n"," "," numpy"," \\\n"," "," python","-dot","env"," \\\n"," "," flask"," "," #"," optional",":"," expose"," as"," a"," web"," service","\n","``","`\n\n","```","python","\n","#"," Download"," spa","Cy"," and"," N","LT","K"," models"," (","run"," once",")\n","!","python"," -","m"," sp","acy"," download"," en","_core","_web","_sm","\n","import"," nltk","\n","n","ltk",".download","('","punkt","')\n","``","`\n\n",">"," **","Why"," these","?","**"," \n",">"," *"," **","spa","Cy","**"," –"," Fast"," token","isation"," +"," POS"," tagging"," +"," built","‑","in"," “","text","‑","similar","ity","”."," \n",">"," *"," **","V","ADER","**"," –"," Excellent"," for"," real","‑","time"," sentiment"," on"," informal"," chat","."," \n",">"," *"," **","Text","Blob","**"," –"," Quick"," noun","‑","phrase"," extraction"," if"," you"," don","’t"," want"," RA","KE","."," \n",">"," *"," **","H","ug"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Chat","maxValue":365.5,"maxValueTokenIndex":701,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,32.09375,205.75,0,0,0,51.65625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,113.0625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,23.78125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,74.3125,197.375,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,61.90625,0,0,0,0,0,92,309.25,34.1875,0,95.0625,0,0,0,58.46875,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,168.125,149.625,365.5,150,0,0,140.25,271.25,80.4375,0,30.953125,56.3125,0,0,77.0625,46.0625,79,314,229.625,76.6875,334.5,220.625,250,88.4375,26.875,122.9375,97.0625,0,122.8125,146.875,210.5,22.390625,53.53125,0,0,0,0,0,0,0,0,0,0,0,0,77.75,212.375,43.84375,71.8125,95.75,0,0,65.875,0,0,68,35.09375,0,113.8125,34.59375,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,28.9375,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"wacxv3cqx2e2l2orjqdh6wq2","tokens":["<|start|>","system","<|message|>","You"," are"," Chat","GPT",","," a"," large"," language"," model"," trained"," by"," Open","AI",".\n","Knowledge"," cutoff",":"," ","202","4","-","06","\n","Current"," date",":"," ","202","5","-","09","-","18","\n\n","Reason","ing",":"," medium","\n\n","#"," Valid"," channels",":"," analysis",","," commentary",","," final","."," Channel"," must"," be"," included"," for"," every"," message",".","<|end|>","<|start|>","user","<|message|>","Develop"," a"," Python"," script"," that"," can"," analyze"," the"," textual"," data"," of"," customer"," reviews"," and"," determine"," the"," most"," common"," location","-based"," complaints","."," The"," script"," should"," parse"," the"," text"," data"," to"," identify"," relevant"," keywords"," and"," phrases"," pertaining"," to"," concerns"," about"," specific"," areas"," or"," regions","."," Additionally",","," the"," script"," should"," be"," capable"," of"," identifying"," patterns"," and"," trends"," in"," the"," location","-based"," complaints"," across"," different"," customer"," reviews","."," Furthermore",","," the"," script"," should"," be"," able"," to"," generate"," a"," report"," summar","izing"," the"," key"," location","-based"," concerns"," and"," statistics"," about"," their"," frequency"," in"," the"," data"," set",".","<|end|>","<|start|>","assistant","<|channel|>","analysis","<|message|>","We"," need"," to"," develop"," a"," Python"," script","."," Requirements",":"," analyze"," textual"," data"," of"," customer"," reviews",","," determine"," most"," common"," location","-based"," complaints","."," Parse"," text"," to"," identify"," relevant"," keywords","/","phr","ases"," about"," concerns"," about"," specific"," areas","/","regions","."," Identify"," patterns","/tr","ends"," across"," reviews","."," Generate"," a"," report"," summar","izing"," key"," location","-based"," concerns"," and"," stats"," about"," frequency",".\n\n","Essential","ly",","," we"," need"," to"," load"," data",","," use"," NLP",":"," maybe"," spa","Cy"," for"," N","ER"," to"," detect"," location"," entities","."," Also"," define"," a"," set"," of"," complaint"," keywords",":"," negative"," words",","," or"," look"," for"," pairs",":"," [\"","bad","\","," \"","poor","\","," \"","problem","\","," \"","compl","aint","\","," \"","issue","\"]"," near"," location"," names","."," Use"," regex"," to"," find"," area"," names","."," Could"," also"," use"," fuzzy"," matching","."," We"," can"," use"," a"," pre","-trained"," NLP"," model"," like"," spa","Cy","'s"," '","en","_core","_web","_sm","'"," to"," identify"," G","PE"," entities","."," Then"," combine"," with"," complaint"," scores",":"," compute"," term"," frequencies"," of"," location"," entities","."," For"," patterns","/tr","ends",","," maybe"," time","-based","?"," But"," not"," needed"," –"," just"," across"," reviews",".\n\n","We'll"," produce"," a"," report",":"," possibly"," a"," markdown"," or"," text"," file"," listing"," top"," ","10"," locations"," and"," counts",","," breakdown"," of"," complaints",".\n\n","Need"," to"," provide"," a"," script"," structure",":"," import"," libs",":"," pandas",","," sp","acy",","," collections",".Counter",","," re","."," Provide"," placeholder"," data"," loading",":"," read"," CSV"," with"," '","review","_text","'"," column","."," Option","ally"," read"," from"," file","."," Provide"," a"," function"," to"," extract"," complaints"," by"," location",".\n\n","Algorithm",":"," For"," each"," review",","," use"," spa","Cy"," to"," process",";"," extract"," G","PE"," entities","."," For"," each"," entity",","," check"," if"," the"," review"," contains"," negative"," sentiment"," words"," or"," complaint"," keywords","."," We"," can"," also"," run"," sentiment"," analysis"," with"," Text","Blob"," or"," Vader","."," But"," easier",":"," check"," presence"," of"," negative"," words"," in"," proximity",".\n\n","Simpl","ify",":"," For"," each"," review",","," get"," all"," G","PE"," entities","."," If"," any"," \"","compl","aint"," keyword","\""," present",","," assume"," it's"," a"," complaint"," about"," that"," location","."," Count"," occurrences"," of"," each"," location",".\n\n","Also",","," we"," can"," identify"," patterns",":"," maybe"," grouping"," by"," month","/year"," if"," date"," column"," exists",".\n\n","Output",":"," generate"," a"," Markdown"," report"," summar","izing"," frequencies"," and"," maybe"," top"," ","5"," location"," concerns",".\n\n","Also",","," we"," could"," show"," bar"," chart"," using"," matplotlib",".\n\n","We"," need"," to"," produce"," a"," script",":"," may"," have"," main","()",".\n\n","Ensure"," to"," explain"," how"," to"," install"," dependencies",".\n\n","Let's"," craft"," the"," answer",":"," Provide"," script"," file"," with"," code",","," doc","string",","," maybe"," data"," assumption",".\n\n","Also"," explain"," steps",".\n\n","We"," might"," incorporate"," a"," small"," test"," dataset"," at"," the"," end"," for"," demonstration",".\n\n","Let's"," produce",".","<|end|>","<|start|>","assistant","<|channel|>","final","<|message|>","Below"," is"," a"," **","ready","‑","to","‑","run"," Python"," script","**"," that"," does"," exactly"," what"," you"," asked"," for",":\n\n","*"," Loads"," a"," data"," set"," of"," customer"," reviews"," (","CSV"," with"," a"," column"," called"," **","`","review","_text","`","**",").\n","*"," Uses"," **","spa","Cy","**"," to"," recognise"," *","location","*"," entities"," (","G","PE"," –"," “","geo","‑","polit","ical"," entity","”",").\n","*"," Looks"," for"," typical"," “","compl","aint","”"," words"," (`","poor",","," bad",","," issue",","," messed"," up",","," etc","."," …","`)"," around"," the","\n"," "," entity"," and"," counts"," how"," many"," times"," each"," location"," is"," tied"," to"," a"," complaint",".\n","*"," (","Optional",")"," If"," the"," data"," set"," contains"," a"," date"," column"," it"," can"," summar","ise"," trends"," over"," time",".\n","*"," Builds"," a"," **","Markdown"," report","**"," with"," the"," top","‑","N"," location"," complaints"," and","\n"," "," a"," quick"," bar","‑","plot"," using"," **","mat","plotlib","**",".\n\n","Feel"," free"," to"," tweak"," the"," list"," of"," complaint"," keywords",","," the"," number"," of"," top"," results",","," or"," to","\n","add"," more"," sophisticated"," NLP"," (","sent","iment"," models",","," rule","‑","based"," ge","olocation",","," etc",".).\n\n","---\n\n","```","python","\n","#!/","usr","/bin","/env"," python","3","\n","\"\"\"\n","customer","_location","_com","pl","aints",".py","\n","--------------------------------","\n\n","This"," script"," parses"," a"," CSV"," with"," customer"," reviews",","," extracts"," location","‑","based","\n","compl","aints",","," aggregates"," them",","," and"," produces"," a"," short"," Markdown"," report"," +"," a","\n","bar","‑","plot"," visual","ising"," the"," most"," frequent"," concerns",".\n\n","Dependencies","\n","------------\n","pip"," install"," pandas"," sp","acy"," matplotlib","\n","python"," -","m"," sp","acy"," download"," en","_core","_web","_sm","\n\n","File"," format","\n","------------\n","CSV"," with"," at"," least"," one"," column"," named"," ``","review","_text","``","."," \n","Optional"," columns"," that"," can"," be"," used"," are"," ``","review","_id","``"," and"," ``","review","_date","``",".\n","\"\"\"\n\n","import"," os","\n","import"," sys","\n","import"," re","\n","import"," argparse","\n","import"," pathlib","\n","import"," warnings","\n","from"," collections"," import"," Counter","\n","from"," datetime"," import"," datetime","\n\n","import"," pandas"," as"," pd","\n","import"," matplotlib",".pyplot"," as"," plt","\n","import"," sp","acy","\n","from"," sp","acy",".matcher"," import"," Phrase","Matcher","\n\n","#"," ----------------------------------------------------------------","-------\n","#"," ","1","."," Configure"," arguments","\n","#"," ----------------------------------------------------------------","-------","\n\n\n","def"," parse","_args","():\n"," "," parser"," ="," argparse",".Argument","Parser","(\n"," "," description","=\"","Analyse"," location","‑","based"," complaints"," from"," customer"," reviews",".\"\n"," "," )\n"," "," parser",".add","_argument"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Chat","maxValue":357,"maxValueTokenIndex":312,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,201.125,68.5,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,49.5,95,174,52.40625,0,245.75,184.125,253.875,50.6875,357,236.375,239.125,164.375,39.0625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,42.28125,225,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,167.375,32.71875,72.3125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,44.6875,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,59.9375,259,32.53125,25.453125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,73.875,0,0,50.25,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,56.90625,295.5,0,0,0,0,44.59375,160.25,332,240.5,102.25,302.25,51.6875,239.625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,95.0625,0,0,0,0,0,0,0,84.125,278,75.625,0,0,182.125,0,0,0,0,0,0,0,0,0,0,0,0,29.84375,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,197.125,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"j0e1wu1unc30jjpet3kpi1if","tokens":["<|start|>","system","<|message|>","You"," are"," Chat","GPT",","," a"," large"," language"," model"," trained"," by"," Open","AI",".\n","Knowledge"," cutoff",":"," ","202","4","-","06","\n","Current"," date",":"," ","202","5","-","09","-","18","\n\n","Reason","ing",":"," medium","\n\n","#"," Valid"," channels",":"," analysis",","," commentary",","," final","."," Channel"," must"," be"," included"," for"," every"," message",".","<|end|>","<|start|>","user","<|message|>","Create"," a"," Python"," program"," that"," utilizes"," natural"," language"," processing"," techniques"," to"," identify"," patterns"," in"," a"," given"," text"," dataset","."," The"," program"," should"," be"," able"," to"," detect"," and"," extract"," patterns"," such"," as"," sentence"," structure",","," frequently"," used"," words"," and"," phrases",","," and"," overall"," language"," style","."," Additionally",","," the"," program"," should"," provide"," visual","izations"," or"," other"," means"," to"," help"," identify"," and"," interpret"," patterns"," within"," the"," text"," data",".","<|end|>","<|start|>","assistant","<|channel|>","analysis","<|message|>","We"," need"," to"," produce"," a"," Python"," program"," that"," uses"," NLP"," to"," identify"," patterns",":"," sentence"," structure",","," frequently"," used"," words","/","phr","ases",","," overall"," language"," style","."," Should"," provide"," visual","izations","."," So"," we"," can"," create"," a"," script"," using"," nltk",","," sp","acy",","," gens","im",","," etc","."," Provide"," code","."," Also"," demonstration"," with"," sample"," dataset","?"," Provide"," instructions","."," Should"," include"," generating"," word"," clouds",","," bar"," charts",","," frequency"," distributions",","," n","-","gram"," analysis","."," Also"," parse"," sentence"," parse"," tree"," to"," detect"," structure","."," Use"," spa","Cy","'s"," dependency"," parse","."," Provide"," styl","ometric"," features",":"," average"," sentence"," length",","," POS"," tag"," distribution",".\n\n","We"," need"," to"," produce"," a"," program","."," Let's"," consider",":\n\n","-"," Load"," text"," data"," (","list"," of"," texts",")"," from"," file"," or"," directory",".\n\n","-"," Pre","process",":"," tokenize",","," remove"," stop","words",","," punctuation",".\n\n","-"," Compute"," word"," frequencies"," and"," phrase"," n","-","gram"," frequencies"," (","2","-","grams",","," ","3","-","grams",")."," Use"," collections",".Counter"," or"," nltk",".ng","r","ams",".\n\n","-"," Sentence"," structure",":"," Use"," spa","Cy","'s"," parse"," tree"," to"," maybe"," collect"," dependency"," tree"," sequences"," or"," POS"," tag"," sequences","."," Show"," distribution"," of"," sentence"," length"," (#"," words","),"," parse"," types",".\n\n","-"," Overall"," language"," style",":"," lexical"," diversity"," (","type","/token"," ratio","),"," average"," sentence"," length",","," punctuation"," usage",","," etc","."," Use"," styl","ometric"," metrics",".\n\n","-"," Visual","izations",":"," word"," cloud",","," bar"," charts"," for"," most"," frequent"," words","/","phr","ases",","," sentence"," length"," distribution",","," POS"," distribution"," bar"," chart","."," Possibly"," plot"," parse"," patterns"," using"," matplotlib",".\n\n","-"," Provide"," interactive"," notes",".\n\n","We"," might"," write"," code"," using"," J","upyter"," notebook"," style"," but"," requested"," as"," program","."," Provide"," dependencies",":"," sp","acy",","," nltk",","," word","cloud",","," matplotlib",","," seab","orn","."," Use"," sp","acy"," english"," model"," \"","en","_core","_web","_sm","\"."," Provide"," code"," for"," installation",".\n\n","We"," can"," create"," a"," class"," Text","Pattern","Analyzer"," with"," methods",":\n\n","-"," __","init","__(","self",","," texts",")\n","-"," compute","_word","_f","requencies","\n","-"," compute","_ng","ram","_f","requencies","\n","-"," compute","_sentence","_structure","\n","-"," compute","_style","_metrics","\n","-"," visualize","()\n\n","We"," need"," to"," show"," at"," end"," sample"," output",".\n\n","We"," can"," optionally"," include"," a"," function"," to"," analyze"," text"," dataset"," file",".\n\n","Thus"," I"," will"," provide"," the"," python"," script"," with"," comments",".\n\n","Also"," provide"," an"," example"," dataset",":"," can"," use"," placeholder"," file"," or"," simple"," sample",".\n\n","Plus"," results",".\n\n","Focus"," on"," clarity",".\n\n","Let's"," start",".\n\n","We'll"," deliver"," a"," Python"," file",".\n\n","Also"," instructions"," for"," running",".\n\n","Given"," the"," instructions",","," produce"," final"," answer",":"," a"," Python"," program",";"," show"," features",".\n\n","Let's"," write"," code",":"," at"," the"," top"," import"," statements",";"," define"," functions",";"," at"," main"," create"," an"," instance",";"," call"," methods"," and"," plot"," using"," matplotlib","/se","ab","orn",".\n\n","Because"," the"," user"," didn't"," specify"," environment",","," we"," will"," assume"," CPU","-cap","able"," environment",".\n\n","We'll"," reference"," that"," the"," user"," may"," pip"," install"," necessary"," packages"," if"," not"," already",".\n\n","Also"," we"," might"," integration"," with"," word","cloud",".\n\n","Ok"," produce",".","<|end|>","<|start|>","assistant","<|channel|>","final","<|message|>","Below"," is"," a"," **","ready","‑","to","‑","run"," Python"," script","**"," (`","text","_pattern","_an","alyzer",".py","`)"," that"," does"," the"," following",":\n\n","1","."," Loads"," a"," text"," dataset"," (","either"," a"," single"," `.","txt","`"," file"," or"," all"," `.","txt","`"," files"," from"," a"," folder",")."," \n","2","."," Performs"," standard"," NLP"," preprocessing"," (","token","isation",","," le","mm","atisation",","," stop","‑","word"," removal",","," etc",".)."," \n","3","."," Computes"," a"," range"," of"," “","semantic"," &"," stylist","ic","”"," metrics"," –"," \n"," "," *"," Frequency"," lists"," of"," words"," and"," multi","‑","word"," phrases"," (","n","‑","grams",")."," \n"," "," *"," Sentence","‑","structure"," features"," (","POS","‑","tag"," sequence",","," dependency"," sub","‑","trees",","," average"," sentence"," length",")."," \n"," "," *"," Sty","list","ic"," fingerprints"," (","lex","ical"," diversity",","," average"," words","/s","entence",","," punctuation"," density",","," etc",".)."," \n","4","."," Generates"," visual","isations"," that"," help"," you"," explore"," and"," interpret"," the"," patterns","."," \n","5","."," Saves"," all"," results"," to"," a"," `","results","/","`"," folder"," so"," you"," can"," inspect"," them"," later",".\n\n",">"," **","Dependencies","**"," \n",">"," `","pip"," install"," sp","acy"," nltk"," word","cloud"," matplotlib"," seab","orn"," pandas"," tqdm","`\n\n",">"," **","Model","**"," \n",">"," `","python"," -","m"," sp","acy"," download"," en","_core","_web","_sm","`\n\n","---\n\n","##"," File",":"," `","text","_pattern","_an","alyzer",".py","`\n\n","```","python","\n","#!/","usr","/bin","/env"," python","\n","#"," -*-"," coding",":"," utf","-","8"," -*-\n\n","\"\"\"\n","text","_pattern","_an","alyzer",".py","\n\n","A"," small",","," self","‑","contained"," NLP"," utility"," that"," reads"," a"," text"," corpus",","," extracts"," linguistic","\n","patterns"," (","word","/","phrase"," frequencies",","," sentence"," structure",","," styl","ometric"," fingerprints",")\n","and"," produces"," visual","isations"," for"," quick"," interpretation",".\n\n","Author",":"," "," Chat","GPT"," (","Open","AI",")\n","Date",":"," "," ","202","5","‑","08","‑","08","\n","\"\"\"\n\n","import"," os","\n","import"," glob","\n","import"," json","\n","import"," argparse","\n","import"," pathlib","\n","from"," collections"," import"," Counter",","," defaultdict","\n","from"," typing"," import"," List",","," Tuple",","," Dict","\n\n","import"," numpy"," as"," np","\n","import"," pandas"," as"," pd","\n","import"," matplotlib",".pyplot"," as"," plt","\n","import"," seab","orn"," as"," sns","\n","from"," tqdm"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Chat","maxValue":357,"maxValueTokenIndex":443,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,81.5625,0,0,219.5,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,76.375,204.5,91.6875,0,26.359375,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,39.09375,0,0,0,0,0,0,0,0,0,46.09375,173.875,45.84375,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,88.4375,306.25,0,67.625,0,0,0,0,0,0,0,0,0,0,32.46875,244.875,168.75,315.25,246,43.78125,357,227.75,241.625,107.9375,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,32,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,22.453125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,33.84375,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,118.6875,0,0,0,39.15625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,103.5625,296,101.6875,0,0,0,24.65625,0,0,0,0,0,0,210,81.1875,57.65625,141.875,132,0,0,81.5,115.5625,316.25,230.125,75.0625,293.5,109.9375,244.5,55.96875,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,61.34375,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,56.0625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"mrs4doicg9twdo8svw8kuppb","tokens":["<|start|>","system","<|message|>","You"," are"," Chat","GPT",","," a"," large"," language"," model"," trained"," by"," Open","AI",".\n","Knowledge"," cutoff",":"," ","202","4","-","06","\n","Current"," date",":"," ","202","5","-","09","-","18","\n\n","Reason","ing",":"," low","\n\n","#"," Valid"," channels",":"," analysis",","," commentary",","," final","."," Channel"," must"," be"," included"," for"," every"," message",".","<|end|>","<|start|>","user","<|message|>","im","prove"," my"," preprocessing"," function",","," there"," are"," a"," lot"," of"," meaning","full"," words"," like"," \"","aa","ah","g","\""," or"," \"","zz","zz","zz","\""," in"," my"," text",":\n","stop","_words"," ="," set","(stop","words",".words","('","english","'))\n","lemm","at","izer"," ="," Word","Net","L","em","mat","izer","()\n\n","def"," preprocess","_text","(text","):\n"," "," #"," Remove"," HTML"," tags","\n"," "," text"," ="," re",".sub","(r","'<","[^",">","]*",">',"," '',"," text",")\n"," "," #"," Remove"," special"," characters"," and"," punctuation","\n"," "," text"," ="," re",".sub","(r","'","[^","a","-z","A","-Z","\\s","]',"," '',"," text",")\n"," "," #"," Convert"," to"," lowercase","\n"," "," text"," ="," text",".lower","()\n"," "," #"," Token","ization"," and"," le","mmat","ization","\n"," "," tokens"," ="," [","lemm","at","izer",".le","mmat","ize","(word",")"," for"," word"," in"," text",".split","()"," if"," word"," not"," in"," stop","_words","]\n"," "," return"," '"," '.","join","(tokens",")","<|end|>","<|start|>","assistant","<|channel|>","analysis","<|message|>","Need"," to"," suggest"," improvements",":"," handle"," n","-","grams",","," noise",","," punctuation",","," contractions",","," emojis",","," profanity","."," Use"," spa","Cy",","," handle"," special"," words","."," Use"," regex"," to"," collapse"," repeated"," chars","."," Provide"," code",".","<|end|>","<|start|>","assistant","<|channel|>","final","<|message|>","Below"," is"," a"," **","fully","‑","comment","ed",","," production","‑","ready"," implementation","**"," that"," keeps"," all"," the"," ideas"," you"," already"," have"," (","HTML"," removal",","," non","‑","alpha"," stripping",","," stop","‑","word"," filtering"," &"," le","mmat","ization",")"," but"," adds"," a"," number"," of"," additional"," linguistic",","," statistical"," and"," robustness"," improvements"," that"," will"," dramatically"," increase"," the"," *","meaning","fulness","*"," of"," the"," tokens"," you"," obtain","."," \n\n","Feel"," free"," to"," cherry","‑","pick"," the"," parts"," you"," need",";"," the"," whole"," function"," is"," modular"," so"," you"," can"," drop"," in"," or"," out"," the"," tricks"," that"," best"," suit"," your"," corpus",".\n\n","```","python","\n","#"," ----------------------------------------------------------------","--\n","#"," "," �","�","─"," Imports"," �","�","────────────────","────────────────","────────────────","────","─","\n","#"," ----------------------------------------------------------------","--\n","import"," re","\n","import"," string","\n","from"," collections"," import"," Counter","\n\n","import"," nltk","\n","import"," sp","acy","\n\n","#"," Make"," sure"," the"," required"," N","LT","K"," resources"," are"," downloaded","\n","n","ltk",".download","('","stop","words","')\n","n","ltk",".download","('","word","net","')\n","n","ltk",".download","('","om","w","-","1",".","4","')\n\n","#"," ----------------------------------------------------------------","--\n","#"," "," �","�","─"," ","1","️⃣"," "," Initial","isation"," of"," reusable"," objects"," �","�","────────────────","──","─","\n","#"," ----------------------------------------------------------------","--\n","#"," ","1","."," Stop","‑","words"," –"," you"," can"," extend"," or"," fine","‑","t","une"," this"," list"," later",".\n","STOP","_WORD","S"," ="," set","(n","ltk",".c","orpus",".stop","words",".words","('","english","'))\n\n","#"," ","2","."," Word","Net"," le","mmat","izer"," –"," a"," lightweight"," fallback","\n","WN","_LE","MM","AT","IZER"," ="," nltk",".st","em",".Word","Net","L","em","mat","izer","()\n\n","#"," ","3","."," spa","Cy"," (","en","_core","_web","_sm",")"," –"," the"," best"," of"," both"," worlds",":"," fast"," token","isation","\n","#"," "," +"," robust"," le","mmat","ization"," +"," POS"," tagging","\n","#"," "," If"," you"," don't"," have"," it"," installed",":"," python"," -","m"," sp","acy"," download"," en","_core","_web","_sm","\n","nl","p","_sp","acy"," ="," sp","acy",".load","(\"","en","_core","_web","_sm","\","," disable","=[\"","ner","\","," \"","text","cat","\"])\n\n","#"," ","4","."," Characters"," that"," usually"," signal"," “","noise","”"," (","symbols",","," emojis",","," etc",".)\n","EM","O","JI","_REGEX"," ="," re",".compile","(\n"," "," \"[","\"\n"," "," \"\\","U","000","1","F","600","-\\","U","000","1","F","64","F","\""," "," #"," emot","icons","\n"," "," \"\\","U","000","1","F","300","-\\","U","000","1","F","5","FF","\""," "," #"," symbols"," &"," pict","ographs","\n"," "," \"\\","U","000","1","F","680","-\\","U","000","1","F","6","FF","\""," "," #"," transport"," &"," map"," symbols","\n"," "," \"\\","U","000","1","F","1","E","0","-\\","U","000","1","F","1","FF","\""," "," #"," flags","\n"," "," \"","]+","\",\n"," "," flags","=re",".UN","ICODE",",\n",")\n\n","#"," ----------------------------------------------------------------","--\n","#"," "," �","�","─"," ","2","️⃣"," "," Helper"," utilities"," �","�","────────────────","────────────────","────","──","─","\n","#"," ----------------------------------------------------------------","--\n","def"," clean","_html","(text",":"," str",")"," ->"," str",":\n"," "," \"\"\"","Remove"," any"," HTML","/XML"," tags",".\"\"\"\n"," "," return"," re",".sub","(r","\"<","[^",">","]*",">\","," \"\","," text",")\n\n\n","def"," remove","_em","ojis","(text",":"," str",")"," ->"," str",":\n"," "," \"\"\"","Drop"," all"," emoji"," /"," pict","ographic"," unicode"," characters",".\"\"\"\n"," "," return"," EM","O","JI","_REGEX",".sub","(\"\","," text",")\n\n\n","def"," collapse","_re","peated","_chars","(text",":"," str",","," max","_seq",":"," int"," ="," ","3",")"," ->"," str",":\n"," "," \"\"\"\n"," "," Collapse"," sequences"," of"," repeated"," characters"," (","e",".g","."," \"","so","ooo","\""," →"," \"","soo","\").\n"," "," If"," a"," word"," has"," more"," than"," *","max"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Chat","maxValue":356.75,"maxValueTokenIndex":544,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,115.5625,87.875,0,0,0,0,0,36.9375,0,0,29.65625,0,0,0,28.0625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,79.5625,195.875,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,23.828125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,40.21875,0,0,0,0,0,0,0,0,0,0,0,0,0,0,145.125,153.25,25.5,83.9375,269.5,66.25,33.8125,110.25,104.5,235.25,106.1875,38.0625,0,164.625,209.875,116.625,174.25,65.5,0,114.625,135.625,225.625,34.625,90.375,75.25,0,70,146.125,182,0,39.5625,58.96875,0,29.28125,60.09375,185.625,0,40.34375,65.8125,25.546875,0,55.1875,45.1875,41.3125,0,0,0,0,0,0,0,0,0,0,0,0,39.21875,64.1875,27.359375,0,0,0,0,0,0,0,0,0,27.1875,49.71875,0,0,30.71875,35.1875,0,24.828125,26.171875,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,22.578125,52.34375,0,78.6875,0,86.125,0,54.40625,56.125,0,0,0,28.34375,0,0,35.78125,0,33.03125,0,0,44.53125,33.15625,0,0,0,0,0,0,0,0,0,26.03125,81.6875,29.515625,39.78125,0,0,0,0,50.1875,0,0,30.40625,118.125,22.453125,62.6875,92.25,292.25,102.9375,222.25,356.75,286.25,258,138,85.125,103,47.96875,29.875,0,0,59.78125,97.3125,0,27.953125,27.8125,37.40625,39.4375,53.5625,29.375,0,0,0,89.1875,0,0,47.3125,58,124.875,51.34375,55.8125,23.890625,112.3125,180,72.8125,23.859375,0,0,46.84375,51.0625,329.25,209.75,59.03125,167.875,0,237.75,51.8125,53.8125,129.25,26.15625,93.0625,57.40625,0,163.875,248.125,187.25,0,0,0,194.125,186.875,47.15625,87.6875,0,0,81.75,0,22.984375,42.40625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,29.015625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"x3iowrbqwgqby15s9d7nm7l7","tokens":["<|start|>","system","<|message|>","You"," are"," Chat","GPT",","," a"," large"," language"," model"," trained"," by"," Open","AI",".\n","Knowledge"," cutoff",":"," ","202","4","-","06","\n","Current"," date",":"," ","202","5","-","09","-","18","\n\n","Reason","ing",":"," low","\n\n","#"," Valid"," channels",":"," analysis",","," commentary",","," final","."," Channel"," must"," be"," included"," for"," every"," message",".","<|end|>","<|start|>","user","<|message|>","Entr","ene"," el"," modelo"," con"," el"," siguiente"," código",":"," import"," torch","\n","import"," torch",".nn"," as"," nn","\n","import"," time","\n","from"," torch","text",".datasets"," import"," Penn","Tree","bank","\n","from"," torch","text",".data",".functional"," import"," to","_map","_style","_dataset","\n","from"," torch","text",".data",".utils"," import"," get","_token","izer","\n","from"," torch","text",".v","ocab"," import"," build","_vocab","_from","_iterator","\n","from"," torch",".utils",".data"," import"," Data","Loader","\n\n","#"," ","1","."," Def","inir"," el"," modelo","\n","class"," Transformer","Model","(nn",".Module","):\n"," "," def"," __","init","__(","self",","," vocab","_size",","," d","_model",","," n","head",","," num","_layers","):\n"," "," super","(","Transformer","Model",","," self",").__","init","__()\n"," "," self",".embedding"," ="," nn",".","Embedding","(v","ocab","_size",","," d","_model",")\n"," "," self",".transform","er"," ="," nn",".","Transformer","(d","_model",","," n","head",","," num","_layers",")\n"," "," self",".fc"," ="," nn",".Linear","(d","_model",","," vocab","_size",")\n\n"," "," def"," forward","(self",","," src",","," tgt","):\n"," "," src"," ="," self",".embedding","(src",")\n"," "," tgt"," ="," self",".embedding","(t","gt",")\n"," "," x"," ="," self",".transform","er","(src",","," tgt",")\n"," "," x"," ="," self",".fc","(x",")\n"," "," return"," x","\n\n\n","#"," ","2","."," Prepar","ar"," datos","\n","train","_data","_raw"," ="," to","_map","_style","_dataset","(P","enn","Tree","bank","(split","='","train","'))\n","token","izer"," ="," get","_token","izer","(\"","sp","acy","\","," \"","en","_core","_web","_sm","\")\n\n","#"," Ag","regar"," tokens"," especiales"," (","UNK"," y"," PAD",")"," al"," vocab","ulario","\n","special","s"," ="," ['","<","unk",">","','","<","pad",">","']\n","v","ocab"," ="," build","_vocab","_from","_iterator","((","token","izer","(y",")"," for"," y"," in"," train","_data","_raw","),"," specials","=s","pecial","s",")\n","v","ocab",".set","_default","_index","(v","ocab","['","<","unk",">","'])\n\n","#"," Div","idir"," los"," datos"," en"," conjuntos"," de"," entrenamiento"," y"," valid","ación","\n","train","_ratio"," ="," ","0",".","8","\n","train","_data","_size"," ="," int","(len","(train","_data","_raw",")"," *"," train","_ratio",")\n","train","_data"," ="," train","_data","_raw","[:","train","_data","_size","]\n","valid","_data"," ="," train","_data","_raw","[","train","_data","_size",":","]\n\n\n","#"," ","3","."," Entr","enar"," el"," modelo","\n","def"," generate","_pairs","(tokens",","," shift","=","1","):\n"," "," source"," ="," [","tokens","[i","]"," for"," i"," in"," range","(","0",","," len","(tokens",")"," -"," shift",")]\n"," "," target"," ="," [","tokens","[i","]"," for"," i"," in"," range","(","shift",","," len","(tokens","))]\n"," "," return"," source",","," target","\n\n","def"," tokenize","_data","(text",","," max","_seq","_len","=None","):\n"," "," tokens"," ="," tokenizer","(text",")","[:","max","_seq","_len","]\n"," "," return"," torch",".tensor","([","v","ocab","[token","]"," if"," token"," in"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Chat","maxValue":351.75,"maxValueTokenIndex":302,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,33.21875,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,42.0625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,56.1875,50.9375,0,173.5,58.75,88.75,62.90625,351.75,259,234.625,34.09375,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,35.53125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,46.65625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"s3zh44h1c9rnnr5sn5rvrzdx","tokens":["<|start|>","system","<|message|>","You"," are"," Chat","GPT",","," a"," large"," language"," model"," trained"," by"," Open","AI",".\n","Knowledge"," cutoff",":"," ","202","4","-","06","\n","Current"," date",":"," ","202","5","-","09","-","18","\n\n","Reason","ing",":"," medium","\n\n","#"," Valid"," channels",":"," analysis",","," commentary",","," final","."," Channel"," must"," be"," included"," for"," every"," message",".","<|end|>","<|start|>","user","<|message|>","Build"," a"," Python"," program"," that"," reads"," input"," from"," a"," file"," in"," a"," specific"," format"," (","spec","ify"," the"," format","),"," and"," performs"," various"," text"," analysis"," operations"," on"," it",","," such"," as"," word"," count",","," frequency"," analysis",","," sentiment"," analysis",","," and"," named"," entity"," recognition","."," The"," program"," should"," output"," the"," analysis"," results"," to"," a"," separate"," file"," or"," display"," them"," on"," the"," console","."," The"," program"," should"," also"," have"," error"," handling"," and"," be"," able"," to"," handle"," large"," input"," files"," efficiently",".","<|end|>","<|start|>","assistant","<|channel|>","analysis","<|message|>","We"," need"," to"," build"," a"," python"," program"," with"," read"," from"," file"," format",","," operations",":"," word"," count",","," frequency"," analysis",","," sentiment"," analysis",","," Named"," Entity"," Recognition","."," Output"," results","."," Should"," have"," error"," handling",","," handle"," large"," input"," efficiently","."," Provide"," code"," example",","," explanation",","," instructions","."," Also"," probably"," need"," to"," use"," libraries"," like"," nltk",","," Text","Blob"," or"," V","ADER"," for"," sentiment",","," spa","Cy"," for"," N","ER","."," For"," large"," files",","," we"," should"," process"," line"," by"," line"," or"," chunk"," by"," chunk","."," Use"," memory"," efficient"," counting",":"," streaming","."," We"," should"," implement"," functions",":"," read","_file",","," word","_count",","," frequency","_analysis",","," sentiment","_analysis",","," ner","_analysis","."," Show"," file"," formats",":"," e",".g",".,"," plain"," text"," file","."," Provide"," a"," sample"," config","."," Provide"," a"," README"," style","."," Provide"," code"," snippet"," with"," usage",".\n\n","Also"," include"," requirements",".txt"," file","."," Provide"," the"," actual"," code",".\n\n","We"," need"," to"," make"," sure"," to"," not"," import"," heavy"," modules"," all"," at"," once",";"," can"," laz","ily"," import","."," Provide"," a"," '","main","'"," guard","."," Provide"," robust"," exception"," handling","."," On"," missing"," dependencies",","," show"," message","."," Show"," that"," we"," can"," support"," large"," by"," reading"," chunk"," and"," updating"," stats","."," For"," frequency",","," we"," will"," use"," collections",".Counter"," but"," updating"," as"," we"," go",".\n\n","For"," sentiment",","," if"," large"," text",","," can"," use"," V","ADER"," on"," each"," chunk","."," Sum"," scores",".\n\n","For"," N","ER",","," spa","Cy"," model",";"," but"," spa","Cy"," may"," require"," large"," memory",";"," we"," can"," use"," '","en","_core","_web","_sm","'."," For"," large"," input",","," might"," increase"," memory"," for"," Doc"," objects",";"," can"," iterate"," in"," streaming",".\n\n","We"," need"," to"," share"," the"," entire"," solution",".\n\n","So"," final"," answer",":"," a"," self","-contained"," Python"," script"," with"," explanation",","," requirements",","," sample"," usage",","," error"," handling",","," optimized","."," Provide"," both"," code"," and"," explanation",".\n\n","Let's"," craft"," a"," thorough"," answer",".","<|end|>","<|start|>","assistant","<|channel|>","final","<|message|>","Below"," is"," a"," **","complete",","," ready","‑","to","‑","run"," Python"," program","**"," that","\n\n","*"," reads"," a"," plain","‑","text"," file"," that"," is"," optionally"," split"," into"," “","paragraph","s","”"," (","empty"," line"," ="," new"," paragraph","),"," \n","*"," streams"," the"," file"," so"," that"," even"," very"," large"," documents"," (","hund","reds"," of"," MB"," /"," many"," GB",")"," can"," be"," analysed"," without"," loading"," everything"," into"," memory",","," \n","*"," performs"," the"," four"," requested"," analyses"," –"," **","word"," count"," /"," frequency",","," sentiment",","," named","‑","entity"," recognition","**,"," \n","*"," outputs"," the"," results"," to"," a"," JSON"," file"," (","you"," can"," change"," that"," to"," a"," CSV",","," plain"," text",","," or"," just"," print"," them",")"," and"," also"," shows"," a"," short"," summary"," on"," the"," console",","," \n","*"," contains"," robust"," error"," handling"," for"," IO"," problems"," and"," missing"," third","‑","party"," packages",","," and"," \n","*"," shows"," a"," small"," `","requirements",".txt","`"," so"," that"," everything"," can"," be"," installed"," in"," a"," virtual"," environment",".\n\n",">"," **","Why"," this"," design","?","**"," \n",">"," *"," **","Streaming","**"," –"," we"," never"," read"," the"," whole"," file"," into"," RAM","."," \n",">"," *"," **","Increment","al"," counting","**"," –"," `","collections",".Counter","`"," is"," updated"," for"," every"," chunk","."," \n",">"," *"," **","Stat","eless"," sentiment","**"," –"," V","ADER"," is"," fast"," and"," can"," be"," called"," on"," each"," paragraph",";"," scores"," are"," summed","."," \n",">"," *"," **","Chunk","ed"," N","ER","**"," –"," `","spa","Cy","`"," processes"," in"," a"," streaming"," way"," (`","nl","p",".pipe","`)."," \n\n","---\n\n","##"," ","1","."," File"," format","\n\n","``","`\n","#"," Plain","‑","text"," file",","," optionally"," with"," paragraphs"," separated"," by"," a"," blank"," line","\n\n","Line"," ","1",":"," This"," is"," the"," first"," sentence"," of"," the"," first"," paragraph",".\n","Line"," ","2",":"," It"," contains"," two"," sentences",".\n\n","<","blank"," line",">\n","Line"," ","3",":"," The"," second"," paragraph"," starts"," here",".\n","Line"," ","4",":"," Another"," sentence"," follows",".\n\n","``","`\n\n","*","Not"," required","*:"," you"," can"," also"," feed"," a"," single"," long"," line"," –"," the"," program"," treats"," the"," whole"," file"," as"," one"," paragraph",".\n\n","---\n\n","##"," ","2","."," Project"," layout","\n\n","``","`\n","text","_an","alyzer","/\n","│","\n","├","─"," python","_text","_an","alyzer",".py"," "," #"," ←"," main"," script","\n","├","─"," requirements",".txt","\n","�","�","─"," README",".md"," "," #"," ←"," optional",","," just"," to"," keep"," docs"," together","\n","``","`\n\n","---\n\n","##"," ","3","."," `","requirements",".txt","`\n\n","```","txt","\n","n","ltk","==","3",".","9",".","1","\n","text","blob","==","0",".","17",".","1","\n","sp","acy","==","3",".","7",".","4","\n","en","_core","_web","_sm","==","3",".","7",".","0","\n","t","q","dm","==","4",".","66",".","2","\n","``","`\n\n","Run"," once",":\n\n","```","bash","\n","python"," -","m"," v","env"," v","env","\n","source"," v","env","/bin","/","activate"," "," #"," Windows",":"," v","env","\\","Scripts","\\","activate","\n","pip"," install"," -","r"," requirements",".txt","\n","python"," -","m"," sp","acy"," download"," en","_core","_web","_sm"," "," #"," download"," the"," tiny"," model","\n","``","`\n\n","---\n\n","##"," ","4","."," `","python","_text","_an","alyzer",".py","`\n\n","```","python","\n","#!/","usr"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Chat","maxValue":346.75,"maxValueTokenIndex":406,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,99.3125,0,0,0,0,0,0,0,0,0,108.5,227.125,67.0625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,94.125,254.125,258,55.875,31.875,71.5,223.875,58.59375,83.9375,69.125,0,0,80.9375,0,60.59375,142.75,153.75,346.75,283.5,244.375,89.1875,0,0,0,0,0,34.5625,0,0,40.90625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,55.65625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,28.609375,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,34.96875,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,44.1875,106.625,211.5,52.5,41.15625,0,0,0,0,23.703125,0,151.875,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,32.375,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,47.15625,123.875,0,50.03125,73.5625,0,44.8125,0,0,0,42.5625,0,0,37.34375,0,0,0,0,67.0625,308.5,89.6875,85.875,121.8125,0,105.375,0,0,150.375,345.75,271,263.25,150.375,110.25,176,42.9375,156.125,66,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,64.75,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,84.5,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,114.75,311.5,211.625,140.5,170.625,0,193.75,32.6875,61.71875,139.75,179.5,140.5,193.875,48.28125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"imghqmrp29njvueg5gfb5rfb","tokens":["<|start|>","system","<|message|>","You"," are"," Chat","GPT",","," a"," large"," language"," model"," trained"," by"," Open","AI",".\n","Knowledge"," cutoff",":"," ","202","4","-","06","\n","Current"," date",":"," ","202","5","-","09","-","18","\n\n","Reason","ing",":"," low","\n\n","#"," Valid"," channels",":"," analysis",","," commentary",","," final","."," Channel"," must"," be"," included"," for"," every"," message",".","<|end|>","<|start|>","user","<|message|>","import"," torch","\n","import"," torch",".nn"," as"," nn","\n","from"," torch","text",".datasets"," import"," Wiki","Text","2","\n","from"," torch","text",".data",".functional"," import"," to","_map","_style","_dataset","\n","from"," torch","text",".data",".utils"," import"," get","_token","izer","\n","from"," torch","text",".v","ocab"," import"," build","_vocab","_from","_iterator","\n","from"," torch",".utils",".data"," import"," Data","Loader","\n\n","#"," ","1","."," Define"," the"," model","\n","class"," Transformer","Model","(nn",".Module","):\n"," "," def"," init","(self",","," vocab","_size",","," d","_model",","," n","head",","," num","_layers",","," dropout","=","0",".","1","):\n"," "," super","(","Transformer","Model",","," self",").","init","()\n"," "," self",".embedding"," ="," nn",".","Embedding","(v","ocab","_size",","," d","_model",")\n"," "," self",".transform","er"," ="," nn",".","Transformer","(d","_model",","," n","head",","," num","_layers",","," dropout","=","drop","out",")\n"," "," self",".fc"," ="," nn",".Linear","(d","_model",","," vocab","_size",")\n\n"," "," def"," forward","(self",","," src",","," tgt","):\n"," "," src"," ="," self",".embedding","(src",")\n"," "," tgt"," ="," self",".embedding","(t","gt",")\n"," "," x"," ="," self",".transform","er","(src",","," tgt",")\n"," "," x"," ="," self",".fc","(x",")\n"," "," return"," x","\n\n","#"," ","2","."," Prepar","ar"," datos","\n","train","_data","_raw",","," valid","_data","_raw",","," _"," ="," Wiki","Text","2","(split","=('","train","',"," '","valid","',"," '","test","'))\n","train","_data","_raw"," ="," to","_map","_style","_dataset","(train","_data","_raw",")\n","valid","_data","_raw"," ="," to","_map","_style","_dataset","(valid","_data","_raw",")\n\n","token","izer"," ="," get","_token","izer","(\"","sp","acy","\","," \"","en","_core","_web","_sm","\")\n\n","#"," Ag","regar"," tokens"," especiales"," (","UNK"," y"," PAD",")"," al"," vocab","ulario","\n","special","s"," ="," ['","<","unk",">","','","<","pad",">","']\n","v","ocab"," ="," build","_vocab","_from","_iterator","((","token","izer","(y",")"," for"," y"," in"," train","_data","_raw","),"," specials","=s","pecial","s",")\n","v","ocab",".set","_default","_index"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Chat","maxValue":346.5,"maxValueTokenIndex":329,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,38.71875,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,51.8125,52.9375,0,163.75,59.0625,84.6875,51.40625,346.5,255.125,225.75,33.78125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,42.3125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"t1xcalfn8ul8392duf9nvq1u","tokens":["<|start|>","system","<|message|>","You"," are"," Chat","GPT",","," a"," large"," language"," model"," trained"," by"," Open","AI",".\n","Knowledge"," cutoff",":"," ","202","4","-","06","\n","Current"," date",":"," ","202","5","-","09","-","18","\n\n","Reason","ing",":"," high","\n\n","#"," Valid"," channels",":"," analysis",","," commentary",","," final","."," Channel"," must"," be"," included"," for"," every"," message",".","<|end|>","<|start|>","user","<|message|>","¿Qué"," le"," falta"," a"," este"," código"," para"," obtener"," una"," pred","icción"," y"," no"," <","pad",">"," <","pad",">","?:"," import"," torch","\n","import"," torch",".nn"," as"," nn","\n","import"," time","\n","from"," torch","text",".datasets"," import"," Penn","Tree","bank","\n","from"," torch","text",".data",".functional"," import"," to","_map","_style","_dataset","\n","from"," torch","text",".data",".utils"," import"," get","_token","izer","\n","from"," torch","text",".v","ocab"," import"," build","_vocab","_from","_iterator","\n","from"," torch",".utils",".data"," import"," Data","Loader","\n\n","#"," ","1","."," Define"," the"," model","\n","class"," Transformer","Model","(nn",".Module","):\n"," "," def"," __","init","__(","self",","," vocab","_size",","," d","_model",","," n","head",","," num","_layers",","," dropout","=","0",".","1","):\n"," "," super","(","Transformer","Model",","," self",").__","init","__()\n"," "," self",".embedding"," ="," nn",".","Embedding","(v","ocab","_size",","," d","_model",")\n"," "," self",".transform","er"," ="," nn",".","Transformer","(d","_model",","," n","head",","," num","_layers",","," dropout","=","drop","out",")\n"," "," self",".fc"," ="," nn",".Linear","(d","_model",","," vocab","_size",")\n\n"," "," def"," forward","(self",","," src",","," tgt","):\n"," "," src"," ="," self",".embedding","(src",")\n"," "," tgt"," ="," self",".embedding","(t","gt",")\n"," "," x"," ="," self",".transform","er","(src",","," tgt",")\n"," "," x"," ="," self",".fc","(x",")\n"," "," return"," x","\n\n\n","#"," ","2","."," Prepar","ar"," datos","\n","train","_data","_raw"," ="," to","_map","_style","_dataset","(P","enn","Tree","bank","(split","='","train","'))\n","token","izer"," ="," get","_token","izer","(\"","sp","acy","\","," \"","en","_core","_web","_sm","\")\n\n","#"," Ag","regar"," tokens"," especiales"," (","UNK"," y"," PAD",")"," al"," vocab","ulario","\n","special","s"," ="," ['","<","unk",">","','","<","pad",">","']\n","v","ocab"," ="," build","_vocab","_from","_iterator","((","token","izer","(y",")"," for"," y"," in"," train","_data","_raw","),"," specials","=s","pecial","s",")\n","v","ocab",".set","_default","_index","(v","ocab","['","<","unk",">","'])\n\n","#"," Div","idir"," los"," datos"," en"," conjuntos"," de"," entrenamiento"," y"," valid","ación","\n","train","_ratio"," ="," ","0",".","8","\n","train","_data","_size"," ="," int","(len","(train","_data","_raw",")"," *"," train","_ratio",")\n","train","_data"," ="," train","_data","_raw","[:","train","_data","_size","]\n","valid","_data"," ="," train","_data","_raw","[","train","_data","_size",":","]\n\n\n","#"," ","3","."," Entr","enar"," el"," modelo","\n","def"," generate","_pairs","(tokens",","," shift","=","1","):\n"," "," source"," ="," [","tokens","[i","]"," for"," i"," in"," range","(","0",","," len","(tokens",")"," -"," shift",")]\n"," "," target"," ="," [","tokens","[i","]"," for"," i"," in"," range","(","shift",","," len","(tokens","))]\n"," "," return"," source",","," target","\n\n","def"," tokenize","_data","(text",","," max","_seq","_len","=None","):\n"," "," tokens"," ="," tokenizer","(text",")","[:","max","_seq","_len","]\n"," "," return"," torch",".tensor","([","v","ocab","[token","]"," if"," token"," in"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Chat","maxValue":343.75,"maxValueTokenIndex":323,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,27.015625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,42.75,25.1875,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,56.84375,51.4375,0,177,59.6875,88.75,55.125,343.75,249.5,220.25,31.4375,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,36.6875,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,44.21875,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"t809ftng9j2y8uuxb1nysw7m","tokens":["<|start|>","system","<|message|>","You"," are"," Chat","GPT",","," a"," large"," language"," model"," trained"," by"," Open","AI",".\n","Knowledge"," cutoff",":"," ","202","4","-","06","\n","Current"," date",":"," ","202","5","-","09","-","18","\n\n","Reason","ing",":"," low","\n\n","#"," Valid"," channels",":"," analysis",","," commentary",","," final","."," Channel"," must"," be"," included"," for"," every"," message",".","<|end|>","<|start|>","user","<|message|>","Исп","ольз","уя"," либ","у"," English"," Spa","Cy",","," найти"," в"," тек","сте"," все"," л","екс","ем","ы",","," содержащ","ие"," только"," циф","ры",","," и"," все"," собствен","ные"," существ","ительные"," (","PRO","PN",","," они"," же"," лич","ные"," существ","ительные","),"," подс","читать"," их"," и"," вывести"," в"," HTML"," с"," прав","ым"," вы","рав","нив","анием",".","<|end|>","<|start|>","assistant","<|channel|>","analysis","<|message|>","Need"," to"," explain"," how"," to"," do"," using"," spa","Cy",","," code"," snippet",","," output"," HTML",".","<|end|>","<|start|>","assistant","<|channel|>","final","<|message|>","**","Как"," сохранить"," в"," HTML"," список"," всех"," циф","р"," и"," всех"," собствен","ных"," существ","ительных",","," найден","ных"," в"," тек","сте"," с"," помощью"," Spa","Cy","**\n\n","Н","и","же"," –"," пош","аг","овый"," пример"," (","Python"," ","3",")"," плюс"," готов","ый"," ск","рип","т",".\n","Он",":\n\n","1","."," Заг","руж","ает"," модель"," `","en","_core","_web","_sm","`"," (","или"," любую"," другую","),\n","2","."," Об","рабаты","вает"," произ","воль","ный"," текст",",\n","3","."," На","ходит"," ток","ены",","," в"," которых"," **","в","есь"," текст","**"," состоит"," из"," циф","р"," (`","\\","d","+","`","),\n","4","."," И"," на","ходит"," все"," ток","ены","‑","с","об","ственные"," существ","ительные"," (`","PRO","PN","`","),\n","5","."," С","чит","ает"," их"," количества",",\n","6","."," Форм","ирует"," HTML","‑","таб","ли","цу","/","сп","ис","ок"," и"," вы","рав","ни","вает"," конт","ент"," справа",".\n\n","---\n\n","##"," ","1","."," У","становка","\n\n","```","bash","\n","pip"," install"," sp","acy","\n","python"," -","m"," sp","acy"," download"," en","_core","_web","_sm","\n","``","`\n\n","Если"," использу","ете"," Python"," ","3",".","11","+,"," сдел","айте"," это"," в"," вирту","альном"," окруж","ении",","," чтобы"," избежать"," конфликт","ов",".\n\n","---\n\n","##"," ","2","."," Ск","рип","т","\n\n","```","python","\n","#!/","usr","/bin","/env"," python","3","\n","#"," -*-"," coding",":"," utf","-","8"," -*-\n\n","import"," re","\n","import"," sp","acy","\n","from"," pathlib"," import"," Path","\n","from"," html"," import"," escape","\n\n","#"," ","1","️⃣"," Заг","ру","жа","ем"," модель","\n","nl","p"," ="," sp","acy",".load","(\"","en","_core","_web","_sm","\")\n\n","#"," ","2","️⃣"," Т","екст",","," который"," будем"," анализ","ировать","\n","TEXT"," ="," \"\"\"\n","The"," company"," was"," founded"," in"," ","200","1"," by"," John"," Doe"," and"," Jane"," Smith",".\n","During"," the"," year"," ","202","2",","," the"," revenue"," reached"," $","5",",","000",",","000",".\n","In"," ","202","5",","," the"," new"," headquarters"," in"," New"," York"," will"," open",".\n","\"\"\"\n\n","#"," ","3","️⃣"," Об","рабаты","ваем"," текст","\n","doc"," ="," n","lp","(TEXT",")\n\n","#"," ","4","️⃣"," И","щ","ем"," только","‑","ци","ф","ров","ые"," ток","ены"," и"," собствен","ные"," существ","ительные","\n","number","_","lemma","_pattern"," ="," re",".compile","(r","'","^\\","d","+$","')\n","numbers"," ="," [","tok",".text"," for"," tok"," in"," doc"," if"," number","_","lemma","_pattern",".full","match","(tok",".text",")]\n","props"," ="," [","tok",".text"," for"," tok"," in"," doc"," if"," tok",".pos","_"," =="," \"","PRO","PN","\"]\n\n","#"," ","5","️⃣"," С","ч","ита","ем","\n","num","_of","_numbers"," ="," len","(numbers",")\n","num","_of","_props"," ="," len","(props",")\n\n","#"," ","6","️⃣"," Форм","ируем"," HTML","\n","html","_template"," ="," f","\"\"\"\n","\n","\n","\n"," "," <","meta"," charset","=\"","UTF","-","8","\">\n"," "," <","title",">","А","нал","из"," текста","\n"," "," <","style",">\n"," "," body"," {{","font","-family",":"," Arial",","," sans","-serif",";"," margin",":"," ","2","rem",";","}}\n"," "," .","right"," {{","text","-align",":"," right",";","}}\n"," "," table"," {{","border","-collapse",":"," collapse",";"," width",":"," ","100","%;","}}\n"," "," th",","," td"," {{","border",":"," ","1","px"," solid"," #","ccc",";"," padding",":"," ","0",".","5","rem",";","}}\n"," "," th"," {{","background",":"," #","f","0","f","0","f","0",";","}}\n"," "," \n","\n","\n"," "," <","h","1",">","Р","езульт","аты"," анализа","\n"," "," <","table"," class","=\"","right","\">\n"," "," <","tr","><","th",">","В","есь"," текст"," содержит"," только"," циф","ры","\n"," "," <","td",">{","num","_of","_numbers","}\n"," "," <","tr","><","th",">","С","об","ственные"," существ","ительные"," (","PRO","PN",")\n"," "," <","td",">{","num","_of","_props","}\n"," "," \n\n"," "," <","h","2",">","Под","роб","но","\n"," "," <","h","3",">","Ц","иф","ры","\n"," "," <","ul",">\n"," "," {","''.","join","(f","'<","li",">{","escape","(token",")}'"," for"," token"," in"," numbers",")}\n"," "," \n\n"," "," <","h","3",">","С","об","ственные"," существ","ительные","\n"," "," <","ul",">\n"," "," {","''.","join","(f","'<","li",">{","escape","(token",")}'"," for"," token"," in"," props",")}\n"," "," \n","\n","\n","\"\"\"\n\n","#"," ","7","️⃣"," С","ох","раня","ем"," в"," файл","\n","output","_path"," ="," Path","(\"","analysis","_results",".html","\")\n","output","_path",".write","_text","(html","_template",","," encoding","=\"","utf","-","8","\")\n\n","print","(f","\"","HTML"," сохран","ён"," в"," {","output","_path",".resolve","()","}\")\n","``","`\n\n","**","Что"," делает"," каж","дая"," часть","**\n\n","|"," #"," |"," Ш","аг"," |"," К","рат","кое"," описание"," |\n","|","---","|","-----","|","----------------","--","|\n","|","1","|","З","агрузка"," модели","|","`","nl","p"," ="," sp","acy",".load","(...)","`"," под","г","руж","ает"," ток","ен","из","атор",","," л","ем","мат","из","атор",","," POS","‑","т","ег","гер",".","|\n","|","2","|","Т","екст","|","Можно"," менять",","," даже"," подключ","ить"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Chat","maxValue":342.5,"maxValueTokenIndex":205,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,62.125,180.875,28.015625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,61.40625,0,0,0,0,0,0,0,0,0,0,0,70.375,193.375,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,47.78125,127.875,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,71.6875,27.71875,205.25,107.75,317.25,191.5,89.6875,342.5,254.125,237.625,154.375,96.75,69.6875,109.9375,83.875,56.71875,29.390625,0,27.625,90.375,36.875,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,50.40625,0,0,0,0,0,0,0,0,0,0,112,271.5,37.96875,0,0,55.8125,53.15625,302.25,204,119.875,179.75,0,209.375,66,0,0,52.5,0,61.3125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,105.75,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,58.65625,230.125,44.6875,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,133.75,142,83.125,232.625,42.9375,0,134.5,61.4375,0,141.25,220.125,141.25,0,0,0,181.625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,46.84375,0,0,0,0,0,0,122.75,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,30.6875,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,36.25,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,51.625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,37.96875,153.75,0,22.59375,0,156.5,0,0,139.5,127.375,31.078125,0,31.90625,0,36.0625,82.1875,0,0,0,85.625,56.28125,0,0,0,0,32.90625,42.6875,0,0,0,0,32.53125,27.171875,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"ehvpieodjfi0o4kyhz5su6qv","tokens":["<|start|>","system","<|message|>","You"," are"," Chat","GPT",","," a"," large"," language"," model"," trained"," by"," Open","AI",".\n","Knowledge"," cutoff",":"," ","202","4","-","06","\n","Current"," date",":"," ","202","5","-","09","-","18","\n\n","Reason","ing",":"," low","\n\n","#"," Valid"," channels",":"," analysis",","," commentary",","," final","."," Channel"," must"," be"," included"," for"," every"," message",".","<|end|>","<|start|>","user","<|message|>","Develop"," a"," content","-based"," recommendation"," system"," that"," suggests"," job"," postings"," to"," candidates"," based"," on"," their"," skills"," and"," preferences"," using"," Python"," programming"," language","."," The"," system"," should"," incorporate"," natural"," language"," processing"," techniques"," to"," understand"," candidate","'s"," job"," search"," intent"," and"," generate"," personalized"," job"," recommendations","."," The"," system"," should"," also"," include"," a"," feedback"," loop"," to"," improve"," the"," relevance"," of"," recommendations"," over"," time","."," The"," output"," of"," the"," recommendation"," system"," should"," be"," presented"," in"," a"," user","-friendly"," and"," visually"," appealing"," format",".","<|end|>","<|start|>","assistant","<|channel|>","analysis","<|message|>","Need"," to"," provide"," design"," and"," code"," outline",".","<|end|>","<|start|>","assistant","<|channel|>","final","<|message|>","Below"," is"," a"," “","starter","‑","kit","”"," for"," a"," **","content","‑","based"," job","‑","posting"," recomm","ender","**"," that"," you"," can"," run"," locally"," (","or"," adapt"," to"," a"," web"," app",")."," \n","It"," uses",":\n\n","|"," Layer"," |"," Technology"," |"," Purpose"," |\n","|","-------","|","------------","|","---------","|\n","|"," **","Data","**"," |"," Pand","as",","," SQLite"," |"," Store"," job"," posts",","," candidate"," profiles",","," and"," feedback"," |\n","|"," **","N","LP","**"," |"," spa","Cy"," +"," sc","ikit","‑","learn"," TF","‑","ID","F"," |"," Turn"," job"," titles",","," descriptions",","," and"," CV"," snippets"," into"," vectors"," |\n","|"," **","Model","**"," |"," K","‑","Nearest","‑","Neighbors"," (","cos","ine"," similarity",")"," |"," Find"," most"," similar"," job"," posts"," to"," a"," candidate","’s"," vector"," |\n","|"," **","Feedback","**"," |"," SQLite"," +"," incremental"," update"," of"," the"," candidate"," vector"," |"," Let"," the"," system"," learn"," from"," clicks"," /"," \"","did","n","’t"," apply","\""," |\n","|"," **","UI","**"," |"," Stream","lit"," +"," Plot","ly"," |"," Pretty"," dashboard"," and"," interactive"," feedback"," |\n\n",">"," **","Why"," not"," a"," deep"," network","?","**"," \n",">"," For"," a"," small","‑","to","‑","medium"," sized"," company"," this"," pipeline"," offers"," the"," best"," trade","‑","off"," of"," explain","ability",","," speed",","," and"," maintain","ability","."," If"," you"," later"," collect"," millions"," of"," job"," views",","," you"," can"," replace"," the"," K","NN"," step"," with"," a"," small"," neural"," transformer"," (","e",".g",".,"," B","ERT","‑","based",")"," without"," changing"," the"," rest"," of"," the"," stack",".\n\n","---\n\n","##"," ","1","."," Project"," Structure","\n\n","``","`\n","job","-re","comm","ender","/\n","├","──"," data","/\n","│"," "," �","�","──"," jobs",".csv"," "," #"," id",","," title",","," description",","," tags",","," ...\n","│"," "," �","�","──"," candidates",".csv"," "," #"," id",","," name",","," skills",","," career","_level",","," ...\n","├","──"," models","/\n","│"," "," �","�","──"," vector","izer",".pkl"," "," #"," TF","‑","ID","F"," +"," pre","‑","processing"," pipeline","\n","├","──"," stream","lit","_app",".py","\n","├","──"," requirements",".txt","\n","�","�","──"," README",".md","\n","``","`\n\n","---\n\n","##"," ","2","."," Data","\n\n","###"," ","2",".","1"," Job"," Post","ings"," (`","jobs",".csv","`",")\n\n","|"," Column"," |"," Type"," |"," Description"," |\n","|","--------","|","------","|","-------------","|\n","|"," `","job","_id","`"," |"," int"," |"," Unique"," DB"," id"," |\n","|"," `","title","`"," |"," string"," |"," Title"," of"," the"," position"," |\n","|"," `","description","`"," |"," string"," |"," Full"," job"," description"," |\n","|"," `","skills","`"," |"," string"," |"," CSV"," of"," required"," skills"," (","e",".g",".,"," `\"","python",","," data"," analysis",","," sql","\"","`)"," |\n","|"," `","location","`"," |"," string"," |"," e",".g",".,"," `\"","San"," Francisco",","," CA","\"`"," |\n","|"," `","remote","_type","`"," |"," string"," |"," `\"","remote","\""," |"," \"","hy","brid","\""," |"," \"","ons","ite","\"`"," |\n","|"," `","tags","`"," |"," string"," |"," e",".g",".,"," `\"","machine","-learning",","," backend",","," full","-stack","\"`"," |\n\n","###"," ","2",".","2"," Candidate"," Profiles"," (`","c","andidates",".csv","`",")\n\n","|"," Column"," |"," Type"," |"," Description"," |\n","|","--------","|","------","|","-------------","|\n","|"," `","cand","_id","`"," |"," int"," |"," Unique"," id"," |\n","|"," `","name","`"," |"," string"," |"," Candidate"," name"," |\n","|"," `","skills","`"," |"," string"," |"," CSV"," skills"," |\n","|"," `","desired","_role","`"," |"," string"," |"," “","Data"," Scientist","”,"," “","Full"," Stack"," Engineer","”,"," etc","."," |\n","|"," `","preferred","_location","`"," |"," string"," |"," `\"","Remote","\"","`,"," `\"","City"," A","\"","`,"," etc","."," |\n","|"," `","experience","_year","s","`"," |"," int"," |"," Years"," of"," professional"," experience"," |\n","|"," `","career","_level","`"," |"," string"," |"," “","Junior","”,"," “","Mid","”,"," “","Senior","”,"," etc","."," |\n\n",">"," **","Tip",":**"," If"," you"," have"," PDFs"," of"," resumes"," or"," Linked","In"," profiles",","," let"," spa","Cy"," parse"," them"," into"," the"," `","skills","`"," field"," first","."," That"," gives"," you"," an"," auto","‑","filled"," `","skills","`"," column",".\n\n","---\n\n","##"," ","3","."," NLP"," Pre","‑","Processing"," Pipeline","\n\n","```","python","\n","#"," preprocess",".py","\n","import"," re","\n","import"," sp","acy","\n","from"," sklearn",".feature","_ex","traction",".text"," import"," T","fid","f","Vector","izer","\n","import"," pickle","\n","from"," pathlib"," import"," Path","\n\n","nl","p"," ="," sp","acy",".load","(\"","en","_core","_web","_sm","\")\n\n","def"," clean","_text","(text","):\n"," "," #"," Basic"," cleaning",","," le","mmat","ization",","," stop","‑","word"," removal","\n"," "," doc"," ="," n","lp","(text",".lower","())\n"," "," tokens"," ="," [","token",".","lemma","_"," for"," token"," in"," doc"," if"," not"," token",".is","_stop"," and"," not"," token",".is","_p","unct","]\n"," "," return"," \""," \".","join","(tokens",")\n\n","def"," build","_vector","izer","(df"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Chat","maxValue":336.75,"maxValueTokenIndex":891,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,25.296875,57.96875,241,32.75,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,27.546875,137.375,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,65.5625,0,0,23.015625,0,0,0,0,0,0,101.8125,272.5,65.8125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,65.1875,170.5,61.09375,0,179.5,269.75,219,44.03125,336.75,46.0625,211.5,47.5625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,28.625,42.125,0,119.3125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,22.765625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"x3pfd784icus6m6lj8g47slh","tokens":["<|start|>","system","<|message|>","You"," are"," Chat","GPT",","," a"," large"," language"," model"," trained"," by"," Open","AI",".\n","Knowledge"," cutoff",":"," ","202","4","-","06","\n","Current"," date",":"," ","202","5","-","09","-","18","\n\n","Reason","ing",":"," low","\n\n","#"," Valid"," channels",":"," analysis",","," commentary",","," final","."," Channel"," must"," be"," included"," for"," every"," message",".","<|end|>","<|start|>","user","<|message|>","Develop"," a"," software"," tool"," that"," can"," effectively"," analyze"," textual"," documents"," and"," determine"," the"," most"," frequent"," and"," significant"," words"," and"," phrases"," used"," within"," the"," document","."," The"," software"," should"," be"," able"," to"," identify"," both"," individual"," words"," and"," phrases"," that"," are"," commonly"," used"," within"," the"," document",","," providing"," a"," summary"," of"," the"," text"," content","."," Additionally",","," the"," tool"," should"," have"," built","-in"," algorithms"," to"," recognize"," different"," forms"," of"," the"," same"," word",","," such"," as"," plur","als"," or"," verb"," t","enses",","," to"," ensure"," that"," the"," most"," accurate"," analysis"," is"," provided","."," Finally",","," the"," software"," should"," have"," an"," easy","-to","-use"," interface"," that"," allows"," users"," to"," enter"," a"," document"," or"," multiple"," documents"," to"," be"," analyzed"," and"," view"," the"," resulting"," keyword"," and"," phrase"," analysis",".","<|end|>","<|start|>","assistant","<|channel|>","analysis","<|message|>","Need"," to"," propose"," software"," design",","," components",","," algorithms",","," interface",".","<|end|>","<|start|>","assistant","<|channel|>","final","<|message|>","##"," Project"," Overview"," \n","**","Name",":**"," *","Lex","i","Scope","*"," –"," a"," text","‑","analysis"," engine"," that"," surfaces"," the"," most"," frequent"," and"," sem","antically","‑","important"," words"," &"," phrases"," in"," one"," or"," many"," documents",","," normal","izes"," inf","lections",","," and"," presents"," the"," findings"," through"," an"," intuitive"," UI",".\n\n",">"," **","Goal","**"," –"," Deliver"," a"," self","‑","contained",","," platform","‑","agn","ostic"," tool"," that"," can"," be"," used"," by"," researchers",","," marketers",","," writers",","," and"," developers"," to"," quickly"," discover"," the"," \"","v","ocab","\""," that"," matters"," in"," a"," body"," of"," text",".\n\n","---\n\n","##"," ","1","."," Core"," Functional","ities","\n\n","|"," #"," |"," Feature"," |"," What"," it"," does"," |"," Key"," Technology"," |\n","|","---","|","---------","|","--------------","|","----------------","|\n","|"," ","1"," |"," **","Document"," ingestion","**"," |"," Accept"," single"," or"," multiple"," files"," (","TXT",","," PDF",","," DOC","X",","," HTML",","," Markdown",","," etc",".)"," |"," Apache"," T","ika"," (","Java","/P","ython",")"," or"," doc","x","2","txt"," /"," pdf","miner"," |\n","|"," ","2"," |"," **","Token","ization","**"," |"," Split"," text"," into"," words",","," n","‑","grams"," (","2","‑","grams",","," ","3","‑","grams",")."," |"," spa","Cy"," /"," N","LT","K"," |\n","|"," ","3"," |"," **","Normalization"," /"," Lem","mat","ization","**"," |"," Reduce"," inf","lections"," to"," lemma"," (","e",".g",".,"," *","running"," →"," run","*",")."," |"," spa","Cy"," (","en","_core","_web","_sm",")"," or"," spa","Cy"," +"," Text","Blob"," |\n","|"," ","4"," |"," **","Stop","‑","word"," &"," noise"," removal","**"," |"," Remove"," very"," common"," words",","," numbers",","," punctuation"," |"," Custom"," stop","‑","list"," +"," regex"," |\n","|"," ","5"," |"," **","Frequency"," count","**"," |"," Count"," term",","," big","ram",","," trig","ram"," frequencies"," across"," one"," or"," many"," docs"," |"," Counter"," (","Python",")"," |\n","|"," ","6"," |"," **","TF","‑","ID","F"," weighting"," (","optional",")**"," |"," Rank"," terms"," by"," document","‑","specific"," importance"," |"," sc","ikit","‑","learn"," T","fid","f","Vector","izer"," |\n","|"," ","7"," |"," **","Phrase"," relevance"," scoring","**"," |"," Penal","ize"," content"," words"," that"," appear"," only"," once",","," boost"," n","‑","grams"," with"," high"," pair","wise"," similarity"," |"," J","acc","ard","/I","QR"," or"," Point","wise"," Mutual"," Information"," (","PM","I",")"," |\n","|"," ","8"," |"," **","Result"," presentation","**"," |"," Frequency"," tables",","," charts",","," tag"," clouds",","," ranked"," lists"," |"," Chart",".js"," /"," D","3",".js"," (","web",")"," or"," Mat","plotlib"," (","desktop",")"," |\n","|"," ","9"," |"," **","Export","**"," |"," CSV",","," JSON",","," or"," downloadable"," PDF"," summary"," |"," pandas",".to","_csv"," /"," Report","Lab"," |\n\n","---\n\n","##"," ","2","."," System"," Architecture","\n\n","``","`\n","�","�","────────────────","────────────────","────────────────","────","�","�","\n","│"," "," User"," Interface"," (","UI",")"," "," │","\n","│"," "," (","Web"," or"," Desktop",")"," "," •"," Upload"," documents"," "," │","\n","│"," "," •"," Configure"," settings"," "," │","\n","│"," "," •"," View"," results"," "," │","\n","�","�","────","──","─","▲","────────────────","────","──","▲","────────────────","────","─","�","�","\n"," "," │"," "," │","\n"," "," │"," HTTP"," /"," IPC"," "," │","\n"," "," ▼"," "," ▼","\n","�","�","────────────────","─","�","�"," "," �","�","────────────────","─","�","�","\n","│"," "," Front","‑","End"," API"," "," │"," "," │"," "," Backend"," API"," "," │","\n","│"," "," (","REST","/","Graph","QL",")","│"," "," │"," (","Python","/","Go",")"," "," │","\n","�","�","────","──","─","▲","────────","─","�","�"," "," �","�","────","──","─","▲","────────","─","�","�","\n"," "," │"," "," │","\n"," "," │"," "," Calls"," Service"," Layer"," │","\n"," "," ▼"," "," ▼","\n","�","�","────────────────","────","──","─","�","�"," "," �","�","────────────────","────","──","─","�","�","\n","│"," "," Text","‑","Processing"," Layer"," │"," "," │"," "," Storage"," Layer"," (","B","‑","s",")"," "," │","\n","│"," "," •"," In","gest",","," parse",","," "," │"," "," │"," "," •"," Metadata",","," raw"," text"," "," │","\n","│"," "," •"," Token","ize",","," normalize"," │"," "," │"," "," •"," Frequency"," tables"," "," │","\n","│"," "," •"," Count"," &"," score"," "," │"," "," │"," "," •"," User"," configs"," "," │","\n","�","�","────────────────","────","──","─","�","�"," "," �","�","────────────────","────","──","─","�","�","\n","``","`\n\n","*"," **","Front","‑","end"," (","React","/V","ue",")**"," –"," Single","‑","page"," UI"," with"," drag","‑","and","‑","drop",","," bulk"," upload",","," and"," real","‑","time"," progress",".\n","*"," **","Back","‑","end","**"," –"," A"," lightweight"," service"," (","Python"," Fast","API"," or"," Go"," Gin",")."," \n"," "," *"," Handles"," file"," I","/O",","," launches"," spa","Cy"," pipelines",","," stores"," per","‑","document"," stats"," in"," SQLite"," or"," embedded"," Rocks","DB",".\n"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Chat","maxValue":327.25,"maxValueTokenIndex":450,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,98.8125,192.5,33.625,0,0,49.0625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,27.484375,65.0625,210.25,82.125,76.75,327.25,258,214.75,65.125,26.890625,0,181.625,42.65625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,40.53125,180,88.1875,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"rbcwj2f46orokox5gfzmm97i","tokens":["<|start|>","system","<|message|>","You"," are"," Chat","GPT",","," a"," large"," language"," model"," trained"," by"," Open","AI",".\n","Knowledge"," cutoff",":"," ","202","4","-","06","\n","Current"," date",":"," ","202","5","-","09","-","18","\n\n","Reason","ing",":"," medium","\n\n","#"," Valid"," channels",":"," analysis",","," commentary",","," final","."," Channel"," must"," be"," included"," for"," every"," message",".","<|end|>","<|start|>","user","<|message|>","Provide"," step","-by","-step"," instructions"," for"," setting"," up"," G","ens","im"," in"," a"," Python"," environment",","," specifying"," how"," to"," load"," and"," preprocess"," various"," types"," of"," text"," corp","ora","."," Explain"," the"," different"," topic"," modeling"," algorithms"," supported"," by"," G","ens","im",","," and"," how"," to"," choose"," and"," evaluate"," the"," best"," one"," for"," a"," given"," corpus","."," Show"," how"," to"," train"," and"," save"," word"," embeddings"," using"," G","ens","im",","," including"," options"," for"," defining"," the"," embedding"," dimension",","," context"," window"," size",","," and"," training"," method","."," Provide"," examples"," of"," how"," to"," use"," the"," resulting"," topic"," models"," and"," word"," embeddings"," for"," tasks"," such"," as"," document"," classification",","," semantic"," similarity",","," and"," word"," analogy",".","<|end|>","<|start|>","assistant","<|channel|>","analysis","<|message|>","We"," need"," to"," provide"," step","-by","-step"," instructions"," for"," setting"," up"," G","ens","im",","," loading"," and"," preprocessing"," corp","ora",","," explain"," topic"," modeling"," algorithms",","," choose"," and"," evaluate",","," train"," and"," save"," word"," embeddings",","," options"," like"," dimension",","," window",","," training"," method"," (","CB","OW","/","skip","-","gram","),"," then"," show"," usage"," in"," classification",","," similarity",","," word"," analogy","."," Might"," require"," code"," snippets","."," Should"," cover"," environment"," config",","," pip"," install",","," use"," virtual","env"," or"," con","da","."," Use"," pre","-processing",":"," token","ization",","," lower","c","asing",","," stop","words"," removal",","," le","mmat","ization"," using"," spa","Cy"," or"," N","LT","K","."," Topic"," modeling",":"," L","SI",","," L","DA",","," HD","P",","," CT","M"," etc","."," Evaluate"," using"," perplex","ity",","," coherence",","," test"," set"," classification","."," Word"," embeddings",":"," Word","2","Vec",","," Fast","Text",","," Doc","2","Vec","."," Show"," training",","," saving",","," loading","."," Provide"," examples"," of"," classification"," with"," sc","ikit","-le","arn"," logistic"," regression"," using"," inferred"," topic"," vectors"," or"," embeddings"," bag","-of","-","words","."," Semantic"," similarity",":"," gens","im"," similarity"," queries","."," Word"," analogy",":"," model",".w","v",".m","ost","_sim","ilar","(","positive","=['","king","',"," '","woman","'],"," negative","=['","man","'])."," Also"," show"," word"," analogy"," with"," doc","2","vec","?"," We'll"," include"," usage"," with"," gens","im",".models",".Word","2","Vec","."," Provide"," guidance"," on"," hyper","parameters","."," Provide"," scripts","."," Should"," also"," show"," recognizing"," corp","ora",":"," plain"," text",","," csv",","," json",","," scr","apped",","," gens","im",".c","orp","ora","."," Provide"," grammar",".\n\n","Make"," it"," step","-by","-step"," listing",".\n\n","Consider"," easy"," to"," read"," sections","."," Use"," code"," fences",".\n\n","Ok","."," Let's"," do",".","<|end|>","<|start|>","assistant","<|channel|>","final","<|message|>","##"," ","1","."," "," Getting"," G","ens","im"," –"," the"," “","install","‑","first","”"," box","\n\n","Below"," you","’ll"," find"," a"," **","bash","‑","style","**"," (","Linux","/mac","OS","/","WS","L",")"," and"," a"," **","Windows","‑","CMD","**"," recipe","."," \n","They"," create"," a"," clean"," virtual"," environment",","," install"," G","ens","im"," **","and","**"," the"," most"," common"," NLP"," tools"," we","’ll"," need"," later",".\n\n","|"," |"," Linux","/mac","OS","/","WS","L"," |"," Windows"," |\n","|","---","|","---","|","---","|\n","|","**","Create"," &"," activate"," a"," virt","‑","env","**","|","```","bash","\\n","python","3"," -","m"," v","env"," gens","im","_env","\\n","source"," gens","im","_env","/bin","/","activate","\\n","```","|","```","bat","\\n","python"," -","m"," v","env"," gens","im","_env","\\","ng","ens","im","_env","\\","Scripts","\\","activate","\\n","```","|\n","|","**","Upgrade"," pip","**","|","```","bash","\\n","pip"," install"," -","U"," pip","\\n","```","|","```","bat","\\n","pip"," install"," -","U"," pip","\\n","```","|\n","|","**","Install"," core"," stack","**","|","```","bash","\\n","pip"," install"," gens","im","==","4",".","2",".","0"," "," #"," latest"," L","TS"," as"," of"," ","202","5","-","08","\\n","pip"," install"," numpy"," scipy"," pandas"," tqdm","\\n","pip"," install"," sp","acy","==","3",".","6"," "," #"," for"," le","mmat","ization","\\n","```","|","```","bat","\\n","pip"," install"," gens","im","==","4",".","2",".","0","\\n","pip"," install"," numpy"," scipy"," pandas"," tqdm","\\n","pip"," install"," sp","acy","==","3",".","6","\\n","```","|\n","|","**","Download"," spa","Cy"," model","**","|","```","bash","\\n","python"," -","m"," sp","acy"," download"," en","_core","_web","_sm","\\n","```","|","```","bat","\\n","python"," -","m"," sp","acy"," download"," en","_core","_web","_sm","\\n","```","|\n\n",">"," **","Tip",":**"," If"," you"," want"," to"," experiment"," with"," **","fast","Text","**"," or"," **","Open","AI","‑","style"," embeddings","**"," later",","," also"," `","pip"," install"," fast","text","==","0",".","9",".","2","`"," (","or"," the"," newer"," `","fast","text","`"," package",")"," and"," `","pip"," install"," sentence","-transform","ers","`.\n\n","---\n\n","##"," ","2","."," "," Loading"," &"," preprocessing"," a"," text"," corpus","\n\n","G","ens","im"," works"," with"," **","cor","pora","**"," that"," are"," list","‑","like"," collections"," of"," token","ized"," documents","."," \n","Below"," are"," common"," ways"," to"," build"," this"," list",","," followed"," by"," a"," canonical"," preprocessing"," pipeline",".\n\n","###"," ","2",".","1"," "," From"," a"," plain","‑","text"," file","\n\n","```","python","\n","import"," pathlib","\n","from"," gens","im",".utils"," import"," simple","_pre","process","\n\n","cor","pus","_path"," ="," pathlib",".Path","('","data","')\n","docs"," ="," []\n\n","for"," txt","_file"," in"," corpus","_path",".glob","('","*.","txt","'):\n"," "," with"," open","(txt","_file",","," encoding","='","utf","-","8","')"," as"," f",":\n"," "," docs",".append","(f",".read","())\n\n","#"," quick"," token","ization"," –"," keeps"," only"," alphabet","ic"," tokens",","," lower","‑","cases"," automatically","\n","token","ized","_docs"," ="," [","simple","_pre","process","(d",","," de","acc","=True",")"," for"," d"," in"," docs","]\n","``","`\n\n","###"," ","2",".","2"," "," From"," a"," CSV"," /"," TSV"," –"," one"," column"," per"," document","\n\n","```","python","\n","import"," pandas"," as"," pd","\n","from"," gens","im",".utils"," import"," simple","_pre","process","\n\n","df"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Chat","maxValue":326.25,"maxValueTokenIndex":740,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,22.5,0,0,0,0,0,0,43.9375,0,0,0,0,31,52.0625,104.75,206.25,29.984375,0,0,79.9375,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,44.1875,0,0,60.34375,81,0,0,28.65625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,81.8125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,128.875,300.5,0,63.375,104.125,0,0,39.21875,77.375,0,0,56.875,43.125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,72.25,0,0,0,0,0,0,0,0,0,221,0,55.9375,0,0,0,0,0,0,0,126.25,125.9375,315.25,326.25,85.625,0,0,0,67.5625,0,170.25,62.375,73.0625,279.75,217.5,110.4375,316.75,239.875,223.5,88.3125,0,0,0,0,0,0,0,60.9375,0,204.125,165.75,0,60,29.015625,173.625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,31.3125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,32.53125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,35.09375,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"u4f1083819ar70h12baerehj","tokens":["<|start|>","system","<|message|>","You"," are"," Chat","GPT",","," a"," large"," language"," model"," trained"," by"," Open","AI",".\n","Knowledge"," cutoff",":"," ","202","4","-","06","\n","Current"," date",":"," ","202","5","-","09","-","18","\n\n","Reason","ing",":"," low","\n\n","#"," Valid"," channels",":"," analysis",","," commentary",","," final","."," Channel"," must"," be"," included"," for"," every"," message",".","<|end|>","<|start|>","user","<|message|>","假","如","给","你","很多","的","中文","查询","句","子","，这","些","查询","句","子的","结构","有","很多","，有","些","查询","句","子的","结构","相","似","，有","些","则","不","相","似","，请","问","怎么","把","这些","查询","句","子","进行","分类","，让","结构","相","似","的","查询","句","子","分","到","一起","。","通过","查询","句","子的","结构","相","似","度","进行","聚","类","，而","不是","通过","句","子","语","义","相","似","度","进行","聚","类","，请","用","nl","p","方法","。","请","写","出","完整","的","代码","<|end|>","<|start|>","assistant","<|channel|>","analysis","<|message|>","Need"," to"," explain"," approach"," and"," provide"," code"," using"," spa","Cy"," or"," Transformer"," parse"," trees","."," Provide"," clustering"," using"," sentence"," parse"," trees",","," computing"," similarity"," via"," distances"," between"," dependency"," trees","."," Use"," Tree"," Edit"," Distance"," or"," Le","vens","hte","in"," of"," dependency"," string","."," Provide"," example","."," Let's"," write"," code"," using"," spa","Cy"," to"," get"," dependency"," parse"," tree",","," convert"," to"," adjacency"," list",","," compute"," tree"," edit"," distance"," using"," z","ss"," library","."," Then"," cluster"," via"," Agg","lomer","ative","Cl","ustering"," using"," distance"," matrix","."," Provide"," example"," sentences",".","<|end|>","<|start|>","assistant","<|channel|>","final","<|message|>","下面","给","出","一种"," **","基","于","句","子","依","存","树","结构","相","似","度","**"," 的","聚","类","完整","思","路","和","实现","代码","。"," \n","思","路","概","览","\n\n","|"," �","�","骤"," |"," ","说明"," |"," ","主要","实现"," |\n","|","------","|","------","|","----------","|\n","|"," ","1","."," ","预","处理"," |"," ","读取","中文","查询","句","子","，并","使用"," **","sp","acy","**"," +"," `","zh","_core","_web","_sm","`","（","中文","模型","）","做","分","词"," +"," ","依","存","句","法","分析"," |"," `","sp","acy",".load","(\"","zh","_core","_web","_sm","\")","`"," |\n","|"," ","2","."," �","�","依","存","树","转","成","可","度","量","结构"," |"," ","①"," 将","每","个"," token"," 的"," `","head",".i","`"," 与","自身"," `","i","`"," ","组成","父","–","子","图","。","<","br",">","②"," ","生成","一个","树","的"," **","字符串","表示","**","（","例如"," `","[(","head",",","dep",",","child",")...","]","`","）","或者","构","造","树","对象","供","后","续","编辑","距离","计算"," |"," ","代码","中","实现"," `","tree","_to","_tuple","()`"," �","�","树","转","成","可","序","列","化","形式"," |\n","|"," ","3","."," ","计算","树","编辑","距离"," |"," 使用","开","源","的"," **","z","ss","**","（","Z","hang","‑","Sh","asha"," Tree"," Edit"," Distance","）","库","计算","两","�","�","树","的","最","小","编辑","距离","，","距离","越","小","代表","结构","越","相","似","。"," |"," `","z","ss",".simple","_distance","(tree","A",","," tree","B",","," ...)","`"," |\n","|"," ","4","."," �","�","建","距离","矩","阵"," |"," 对","所有","句","子"," pair","wise"," ","计算","编辑","距离","，","得到"," Nx","N"," 的","对","称","距离","矩","阵","。"," |"," �","�","环","计算","并","存","进"," Num","Py"," 数","组"," |\n","|"," ","5","."," 聚","类"," |"," ","直接","使用"," **","Agg","lomer","ative","Cl","ustering","**","（","层","次","聚","类","）"," 或","者"," **","DB","SCAN","**","（","若","你","想","基","于","距离","�","�","值","直接","分","�","�","）。","这里","演","示"," Agg","lomer","ative","Cl","ustering"," ","以"," `","aff","inity","='","pre","computed","'","`"," ","形式","输入","自","定义","距离","矩","阵","。"," |"," `","Agg","lomer","ative","Cl","ustering","(n","_clusters","=None",","," distance","_threshold","=","�","�","值",","," affinity","='","pre","computed","',"," linkage","='","average","')","`"," |\n","|"," ","6","."," 输出"," |"," 根据","聚","类","结果","把","相","似","结构","的","查询","句","子","聚","在","一起","打印","展示","。"," |"," 简","单","的","循环","打印","各","�","�"," |\n\n","下面","给","出","完整","可","直接","运行","的"," Python"," ","代码","（","需要","额","外","安装"," `","sp","acy","`,"," `","zh","_core","_web","_sm","`,"," `","z","ss","`,"," `","sc","ikit","-le","arn","`","）。"," \n\n","```","python","\n","#"," =================================================================","=====\n","#"," ","依","存","树","结构","相","似","度","聚","类","示","例","\n","#"," =================================================================","=====\n","import"," sp","acy","\n","import"," z","ss","\n","import"," numpy"," as"," np","\n","from"," sklearn",".cluster"," import"," Agg","lomer","ative","Cl","ustering","\n","from"," tqdm"," import"," tqdm","\n\n","#"," ----------------","-----"," ","1","."," ","载","入","中文","模型"," ----------------","-----\n","#"," 若","没","安装","，请","先","运行","：\n","#"," "," pip"," install"," -","U"," sp","acy","\n","#"," "," python"," -","m"," sp","acy"," download"," zh","_core","_web","_sm","\n","nl","p"," ="," sp","acy",".load","(\"","zh","_core","_web","_sm","\")\n\n","#"," ----------------","-----"," ","2","."," ","读取","/","准备","示","例","查询","句","子"," ----------------","-----\n","queries"," ="],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Chat","maxValue":315.5,"maxValueTokenIndex":825,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,73.25,202,30.296875,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,76.5625,189.5,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,27.578125,0,0,0,0,0,0,0,0,0,49.25,0,49.40625,230.25,49.03125,31.953125,70.25,38.15625,285,279.5,256,142,86.4375,67.3125,208.125,70.9375,26.671875,0,0,0,0,0,0,0,0,27.53125,0,26.546875,0,211,204.25,184.125,0,0,0,236.875,83,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,50.1875,0,0,0,110,0,0,0,56.3125,276,0,0,23.71875,26.875,135.25,268.5,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,69.125,258.25,69,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,30.5625,75.5625,73.1875,224.25,0,57.3125,79.8125,66.875,40.375,65.6875,0,0,0,0,0,28.640625,0,0,55.3125,0,72.4375,270.75,0,44.375,88.9375,0,56.0625,79.0625,67,315.5,213.75,0,0,0,216.875,46.65625,78,127.5,69.0625,0,144,237.875,160.375,0,0,0,172.25,43.8125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"meazf9ux3m8r9vlmdmsxxwd4","tokens":["<|start|>","system","<|message|>","You"," are"," Chat","GPT",","," a"," large"," language"," model"," trained"," by"," Open","AI",".\n","Knowledge"," cutoff",":"," ","202","4","-","06","\n","Current"," date",":"," ","202","5","-","09","-","18","\n\n","Reason","ing",":"," low","\n\n","#"," Valid"," channels",":"," analysis",","," commentary",","," final","."," Channel"," must"," be"," included"," for"," every"," message",".","<|end|>","<|start|>","user","<|message|>","Besides"," nltk",","," is"," there"," any"," other"," python"," package"," which"," can"," remove"," stop","words","?","<|end|>","<|start|>","assistant","<|channel|>","analysis","<|message|>","Need"," to"," list"," other"," packages",":"," spa","Cy",","," gens","im",","," text","acy",","," sc","ikit","-le","arn",","," stop","-","words",","," N","LT","K"," alternatives","."," Provide"," usage",".","<|end|>","<|start|>","assistant","<|channel|>","final","<|message|>","Absolutely","!"," While"," the"," **","NL","TK","**"," library"," is"," the"," classic"," go","‑","to"," for"," text"," preprocessing"," in"," Python",","," there"," are"," a"," handful"," of"," other"," libraries"," that"," can"," do"," the"," same"," job"," of"," filtering"," out"," stop","‑","words","."," Below"," is"," a"," quick"," guide"," that"," shows"," you"," the"," most"," widely"," used"," alternatives",","," how"," to"," install"," them",","," and"," a"," minimal"," example"," of"," how"," to"," strip"," stop","‑","words"," with"," each"," one",".\n\n","|"," Library"," |"," Key"," Strength","s"," |"," Typical"," use"," case"," |"," Install"," command"," |"," Quick"," snippet"," |\n","|","---------","|","---------------","|","----------------","--","|","----------------","-|","---------------","|\n","|"," **","spa","Cy","**"," |"," Fast",","," production","‑","ready",","," built","‑","in"," language"," models"," with"," a"," lot"," of"," linguistic"," tools"," |"," Large","‑","scale"," NLP"," pipelines",","," token","ization"," +"," POS"," tagging"," |"," `","pip"," install"," sp","acy","`"," |"," `"," [","token",".text"," for"," token"," in"," doc"," if"," not"," token",".is","_stop","]","`"," |\n","|"," **","gens","im","**"," |"," Optim","ized"," for"," large"," corp","ora",","," word","‑","embedding"," training"," |"," Topic"," modeling"," &"," large","‑","scale"," text"," analytics"," |"," `","pip"," install"," gens","im","`"," |"," `"," [","word"," for"," word"," in"," doc"," if"," word"," not"," in"," stop","list","]","`"," |\n","|"," **","sc","ikit","‑","learn","**"," |"," BSD","‑","licensed",","," great"," if"," you","’re"," already"," using"," it"," for"," ML"," |"," Text"," vector","ization"," for"," ML"," models"," |"," `","pip"," install"," sc","ikit","-le","arn","`"," |"," `","vector","izer"," ="," Count","Vector","izer","(stop","_words","='","english","')","`"," |\n","|"," **","text","acy","**"," |"," Wrapper"," around"," spa","Cy"," that"," adds"," handy"," utilities"," |"," Fast"," stop","‑","word"," removal",","," le","mmat","ization",","," N","ER",","," FO"," |"," `","pip"," install"," text","acy","`"," |"," `"," text","acy",".preprocessing",".remove","_stop","words","(text",","," lang","='","en","')","`"," |\n","|"," **","stop","-","words","**"," (","pip",":"," `","stop","-","words","`)"," |"," Small"," dependency",","," plain"," list"," of"," stop","‑","words"," for"," many"," languages"," |"," Quick"," filtering"," without"," extra"," dependencies"," |"," `","pip"," install"," stop","-","words","`"," |"," `"," [","w"," for"," w"," in"," tokens"," if"," w"," not"," in"," stop","_words","]","`"," |\n","|"," **","simple","‑","nl","p","**"," |"," Minimal"," API",","," good"," for"," quick"," scripts"," |"," Basic"," NLP",","," including"," stop","‑","word"," removal"," |"," `","pip"," install"," simple","-n","lp","`"," |"," `","token","izer",".remove","_stop","_words","(text",")`"," |\n","|"," **","fst","ail","**"," |"," Fast"," text"," processing"," for"," very"," large"," texts"," |"," High","‑","through","put"," pipelines"," |"," `","pip"," install"," f","sta","id","`"," |"," `"," [","w"," for"," w"," in"," words"," if"," w"," not"," in"," f","sta","id",".stop","_words","]","`"," |\n","|"," **","lang","chain","**"," |"," Part"," of"," the"," Lang","Chain"," ecosystem",","," includes"," stop","‑","word"," lists"," |"," Prompt"," engineering"," &"," L","LM"," pipelines"," |"," `","pip"," install"," lang","chain","`"," |"," `","lang","chain",".utils",".helpers",".remove","_stop","words","(text",")`"," |\n\n","---\n\n","##"," ","1","."," spa","Cy","\n\n","```","bash","\n","pip"," install"," sp","acy","\n","python"," -","m"," sp","acy"," download"," en","_core","_web","_sm"," "," #"," download"," a"," small"," English"," model","\n","``","`\n\n","```","python","\n","import"," sp","acy","\n\n","nl","p"," ="," sp","acy",".load","(\"","en","_core","_web","_sm","\")\n\n","text"," ="," \"","The"," quick"," brown"," fox"," jumps"," over"," the"," lazy"," dog",".\"\n","doc"," ="," n","lp","(text",")\n\n","clean","_tokens"," ="," [","token",".text"," for"," token"," in"," doc"," if"," not"," token",".is","_stop","]\n","print","(clean","_tokens",")\n","#"," Output",":"," ['","quick","',"," '","brown","',"," '","fox","',"," '","j","umps","',"," '","lazy","',"," '","dog","',"," '.","']\n","``","`\n\n","*","Why"," choose"," spa","Cy","?","*"," \n","-"," Extremely"," fast"," token","ization"," (~","10","‑","15"," ","M"," tokens","/sec",")."," \n","-"," Built","‑","in"," stop","‑","word"," lists"," for"," many"," languages","."," \n","-"," Good"," default"," POS"," tags",","," N","ER",","," dependency"," parsing"," for"," downstream"," tasks",".\n\n","---\n\n","##"," ","2","."," gens","im","\n\n","```","bash","\n","pip"," install"," gens","im","\n"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Chat","maxValue":311,"maxValueTokenIndex":654,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,44.3125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,97,229.75,38.25,0,0,0,0,40.375,26.15625,0,0,0,0,0,0,0,0,0,0,28.96875,67.25,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,77.6875,0,32.84375,0,0,0,0,0,0,35.4375,0,0,0,0,0,35.28125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,27.546875,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,102,262.75,49.78125,36.6875,117.1875,168.125,77.875,24.796875,56.21875,151.75,103.4375,117.5625,115.125,136.125,220.75,124.875,108.625,39.4375,124.4375,62.25,73.125,0,58.59375,0,51.28125,50.375,90.25,79.125,0,36.03125,0,0,0,0,0,0,0,78.375,239.875,0,0,39.15625,0,0,0,0,0,0,36.28125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,39.375,0,43.125,0,26.546875,66.3125,191.5,27.765625,27.234375,0,0,0,26.25,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,31.15625,0,0,0,0,28.890625,0,0,0,0,0,0,75.375,42,37.75,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,24.625,29.203125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,32.15625,195.25,0,0,56.5,0,0,0,80.8125,231.125,27.15625,0,0,57.46875,39.28125,259.5,222.25,124.9375,311,273.25,234.625,55.15625,87.375,164.375,203.875,136.25,82.5625,228.625,62.46875,0,0,0,0,0,0,48.9375,208.25,28.8125,0,117.6875,68.125,0,133.25,216.75,168.25,0,88.5,42.625,199,23.296875,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,108.75,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,29.40625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,33.0625,162.625,0,0,0,68.125,76.3125,38.8125,0,0,29.234375,0,0,0,0,0,0,0,0,0,114.6875,48.59375,70.75,86.5,0,0,40,24.03125,42.9375,55.1875,40.625,0,35.71875,84.25,49,72.25,0,0,35.53125,0,34.6875,53.46875,0,50.28125,55.53125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"ri66b9vsooxluaiq81gqnsmh","tokens":["<|start|>","system","<|message|>","You"," are"," Chat","GPT",","," a"," large"," language"," model"," trained"," by"," Open","AI",".\n","Knowledge"," cutoff",":"," ","202","4","-","06","\n","Current"," date",":"," ","202","5","-","09","-","18","\n\n","Reason","ing",":"," low","\n\n","#"," Valid"," channels",":"," analysis",","," commentary",","," final","."," Channel"," must"," be"," included"," for"," every"," message",".","<|end|>","<|start|>","user","<|message|>","Write"," a"," Python"," program"," that"," takes"," a"," text"," file"," as"," input",","," performs"," le","mmat","ization"," on"," its"," contents"," using"," a"," NLP"," library",","," and"," outputs"," the"," processed"," text"," to"," a"," new"," file","."," The"," program"," should"," be"," capable"," of"," handling"," multiple"," text"," files"," and"," should"," include"," error"," handling"," for"," cases"," where"," the"," input"," file"," is"," not"," found"," or"," the"," le","mmat","ization"," library"," fails"," to"," process"," the"," text","."," Additionally",","," the"," program"," should"," provide"," options"," for"," the"," user"," to"," specify"," the"," output"," file"," name"," and"," the"," language"," of"," the"," input"," text",","," which"," will"," affect"," the"," le","mmat","ization"," algorithm"," used",".","<|end|>","<|start|>","assistant","<|channel|>","analysis","<|message|>","Need"," to"," provide"," code"," and"," explanation","."," Use"," spa","Cy","."," Handle"," multiple"," files","."," Options"," via"," argparse","."," Include"," error"," handling","."," Provide"," sample"," usage",".","<|end|>","<|start|>","assistant","<|channel|>","final","<|message|>","**","Python"," script"," –"," `","lemm","at","izer",".py","`","**\n\n","```","python","\n","#!/","usr","/bin","/env"," python","3","\n","\"\"\"\n","lemm","at","izer",".py","\n\n","A"," small"," command","‑","line"," tool"," that"," le","mmat","izes"," one"," or"," more"," text"," files"," and"," writes","\n","the"," result"," to"," a"," new"," file"," (","or"," to"," stdout",").\n\n","Features","\n","--------\n","*"," Accept","s"," any"," number"," of"," input"," files",".\n","*"," Lets"," the"," user"," choose"," the"," output"," file"," **","per"," input"," file","**"," (","or"," a"," common"," destination",").\n","*"," Allows"," the"," user"," to"," specify"," the"," language"," (`","en","`,"," `","de","`,"," `","es","`,"," …",")"," –"," the"," chosen","\n"," "," language"," determines"," which"," spa","Cy"," model"," is"," loaded",".\n","*"," Handles"," missing"," files",","," download"," errors",","," and"," other"," exceptions"," gracefully",".\n","\"\"\"\n\n","import"," argparse","\n","import"," pathlib","\n","import"," sys","\n","import"," re","\n","from"," typing"," import"," Iterator","\n\n","#"," ----------------------------------------------------------------","-----------"," #\n","#"," Helper"," –"," spa","Cy"," model"," loader"," --------------------------------","--------------"," #\n","#"," ----------------------------------------------------------------","-----------"," #\n","def"," load","_sp","acy","_model","(lang",":"," str","):\n"," "," \"\"\"\n"," "," Loads"," a"," spa","Cy"," language"," model"," for"," the"," given"," language"," code",".\n"," "," If"," the"," model"," is"," not"," present"," on"," disk",","," it"," will"," be"," downloaded"," automatically","\n"," "," (","the"," first"," time"," it"," is"," used",").\n\n"," "," Parameters","\n"," "," ----------\n"," "," lang"," :"," str","\n"," "," Two","‑","letter"," ISO","‑","639","‑","1"," language"," code"," ('","en","',"," '","de","',"," '","es","',"," ...",").\n\n"," "," Returns","\n"," "," -------\n"," "," n","lp"," :"," sp","acy",".language",".Language","\n"," "," The"," loaded"," language"," model",".\n\n"," "," Raises","\n"," "," ----","--\n"," "," Runtime","Error","\n"," "," If"," the"," requested"," language"," model"," cannot"," be"," loaded",".\n"," "," \"\"\"\n"," "," try",":\n"," "," import"," sp","acy","\n"," "," except"," Import","Error"," as"," e",":\n"," "," raise"," Runtime","Error","(\"","spa","Cy"," is"," not"," installed","."," \"\n"," "," \"","Install"," it"," with"," '","pip"," install"," sp","acy","'","\")"," from"," e","\n\n"," "," model","_alias","es"," ="," {\n"," "," '","en","':"," '","en","_core","_web","_sm","',\n"," "," '","de","':"," '","de","_core","_news","_sm","',\n"," "," '","es","':"," '","es","_core","_news","_sm","',\n"," "," '","fr","':"," '","fr","_core","_news","_sm","',\n"," "," '","it","':"," '","it","_core","_news","_sm","',\n"," "," #"," add"," more"," mappings"," if"," you"," need"," more"," languages","\n"," "," }\n\n"," "," if"," lang"," not"," in"," model","_alias","es",":\n"," "," raise"," Runtime","Error","(f","\"","Unsupported"," language"," code",":"," '{","lang","}'."," \"\n"," "," f","\"","Supported"," codes",":"," {","',"," '.","join","(model","_alias","es",")}","\")\n\n"," "," model","_name"," ="," model","_alias","es","[","lang","]\n\n"," "," try",":\n"," "," n","lp"," ="," sp","acy",".load","(model","_name",")\n"," "," except"," O","SError"," as"," exc",":\n"," "," #"," model"," not"," found"," –"," attempt"," to"," download"," it","\n"," "," print","(f","\"","spa","Cy"," model"," '{","model","_name","}'"," not"," found"," locally","."," \"\n"," "," f","\"","Attempt","ing"," to"," download","...\","," file","=sys",".stderr",")\n"," "," try",":\n"," "," import"," subprocess",","," sys","\n"," "," subprocess",".run","(\n"," "," [","sys",".ex","ecutable",","," \"-","m","\","," \"","sp","acy","\","," \"","download","\","," model","_name","],\n"," "," check","=True","\n"," "," )\n"," "," n","lp"," ="," sp","acy",".load","(model","_name",")\n"," "," except"," Exception"," as"," e",":\n"," "," raise"," Runtime","Error","(\n"," "," f","\"","Failed"," to"," download"," or"," load"," spa","Cy"," model"," '{","model","_name","}'","\")"," from"," e","\n\n"," "," return"," n","lp","\n\n","#"," ----------------------------------------------------------------","-----------"," #\n","#"," Lem","mat","ization"," logic"," ------------------------------------------------","------"," #\n","#"," ----------------------------------------------------------------","-----------"," #\n","def"," le","mmat","ize","_text","(text",":"," str",","," n","lp",")"," ->"," str",":\n"," "," \"\"\"\n"," "," Lem","mat","izes"," the"," given"," text"," using"," spa","Cy",".\n\n"," "," Parameters","\n"," "," ----------\n"," "," text"," :"," str","\n"," "," Raw"," text"," to"," le","mmat","ize",".\n"," "," n","lp"," :"," sp","acy",".language",".Language","\n"," "," Loaded"," spa","Cy"," model",".\n\n"," "," Returns","\n"," "," -------\n"," "," str","\n"," "," Text"," where"," each"," token"," has"," been"," replaced"," by"," its"," lemma",".\n"," "," \"\"\"\n"," "," doc"," ="," n","lp","(text",")\n\n"," "," #"," Keep"," the"," original"," whitespace",","," but"," replace"," each"," token"," with"," its"," lemma",".\n"," "," #"," spa","Cy","'s"," doc"," object"," preserves"," token"," boundaries",".\n"," "," lem","mas"," ="," []\n"," "," for"," token"," in"," doc",":\n"," "],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Chat","maxValue":310.75,"maxValueTokenIndex":553,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,73,62.8125,34.40625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,69.875,0,0,0,0,0,0,0,70.5,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,74.625,255.25,22.859375,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,128.25,0,0,0,0,0,34,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,60.09375,0,57.78125,0,55.71875,0,23.296875,40.375,0,0,0,0,0,0,0,0,55.1875,49.625,0,31.1875,70.75,279.25,255,47.3125,65.9375,0,0,0,0,0,0,111.4375,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,64.5625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,189.875,148.25,23.640625,0,0,0,0,0,26.40625,0,0,44.5,35.65625,211.875,190,78.125,0,0,0,96.125,0,0,71.625,88.0625,95.3125,265,165,240.5,46.15625,77.75,0,40.5,0,0,0,0,85.9375,232.25,37.75,0,69.25,59.21875,31,0,94.625,0,51.9375,111.5625,30.203125,0,43.0625,0,28.828125,30.203125,0,85.8125,33.9375,0,0,0,0,0,0,0,0,56.5,0,0,0,0,0,0,0,0,0,0,62.625,0,35.40625,0,0,63.65625,0,117.8125,0,0,0,0,0,0,0,0,26.03125,0,55.21875,0,0,57,172.625,0,29.328125,208,98.5625,99.5625,0,0,56.71875,37.125,133.125,195.125,0,0,0,0,0,0,0,0,0,0,0,0,0,56.375,0,76.9375,149.375,0,53.34375,56,0,0,0,49.625,0,0,93,0,41.8125,220.625,0,0,0,0,0,0,0,0,0,0,0,0,0,65.875,131.5,0,0,0,0,0,0,0,0,0,0,0,0,0,0,232.5,0,0,0,0,0,61.375,208,25.53125,0,0,0,59,0,92.8125,25.234375,161.875,165,310.75,243.75,189.5,88,0,0,23.421875,0,144.5,56.75,197,212.25,127.8125,28.34375,0,24.546875,0,0,101.5,55.0625,243.25,194.75,68.625,0,72.1875,33.75,0,0,112.3125,27.453125,0,160.125,67.75,0,0,38.9375,0,0,59.25,0,66.4375,174.375,68.3125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,147,0,0,0,0,0,0,0,0,0,0,32.28125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,82.5625,0,0,0,0,56.65625,164.375,98.625,0,102.375,0,0,0,0,35,55.1875,0,0,107.1875,31.65625,152.625,0,0,163.75,213.625,75.0625,98.75,70.5,0,0,0,32.71875,0,0,0,0,0,159,0,38.15625,0,0,45.6875,96.9375,82.8125,0,32.6875,0,0,0,0,166.25,152.375,30.265625,34.71875,29.40625,48.25,0,34.125,24.53125,0,0,0,0,0,0,0,42.625,67.6875,0,0,0,0,0,0,0,0,56.65625,0,0,0,0,0,0,0,0,0,0,0,0,116.125,0,0,0,0,0,0,58,234.25,0,82.6875,184.5,37.71875,151.75,77.9375,0,0,0,0,0,0,0,40.375,22.84375,81.6875,0,0,133.875,158.875,0,92.25,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,28.28125,0,152,88.8125,0,0,0,0,0,0,0,0,0,0,0,44.25,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,30.765625,138,0,0,0,0,0,0,0,0,0,0,0,0,0,0,40.875,160.875,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,25.96875,140.75,0,26.84375,117.6875,72.0625,105.1875,0,0,33.84375,0,148,130.625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,23.390625,0,0,0,112.25,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,86.125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"w1dr06aqn12b51zpkgorzfaf","tokens":["<|start|>","system","<|message|>","You"," are"," Chat","GPT",","," a"," large"," language"," model"," trained"," by"," Open","AI",".\n","Knowledge"," cutoff",":"," ","202","4","-","06","\n","Current"," date",":"," ","202","5","-","09","-","18","\n\n","Reason","ing",":"," medium","\n\n","#"," Valid"," channels",":"," analysis",","," commentary",","," final","."," Channel"," must"," be"," included"," for"," every"," message",".","<|end|>","<|start|>","user","<|message|>","Is"," it"," possible"," to"," write"," a"," python"," code"," that"," detects"," Inter","jections"," in"," a"," text"," file"," \n","and"," highlights"," them"," by"," placing"," a"," \"[","{","(","Inter","jection",")}","]\""," suffix"," before"," them"," in"," an"," output"," file","?","<|end|>","<|start|>","assistant","<|channel|>","analysis","<|message|>","We"," need"," to"," produce"," Python"," code"," that"," detects"," inter","jections"," in"," a"," text"," file"," and"," highlights"," them"," by"," placing"," a"," \"[","{","(","Inter","jection",")}","]\""," suffix"," before"," them"," in"," an"," output"," file","."," The"," question",":"," \"","Is"," it"," possible"," to"," ...","?\""," They"," want"," code","."," So"," answer",":"," yes",","," here's"," sample"," code",","," using"," N","LT","K"," or"," regex","."," We"," should"," discuss"," inter","jection"," detection",":"," simple"," approach",":"," maintain"," list"," of"," common"," inter","jections","."," But"," we"," can"," also"," use"," POS"," tag","ger"," in"," N","LT","K"," to"," detect"," inter","jections"," (","tag"," '","UH","')."," So"," code",":"," read"," input"," file",","," tokenize",","," pos"," tag",","," then"," rewrite"," token"," with"," preceding"," suffix","."," Then"," output"," to"," file","."," Also"," show"," usage",","," maybe"," read"," from"," command"," line","."," We'll"," provide"," sample"," code"," in"," python"," with"," N","LT","K"," usage","."," Also"," mention"," requirement",":"," pip"," install"," nltk",","," nltk",".download","('","punkt","'),"," '","aver","aged","_per","ce","ptr","on","_t","agger","',"," '","tree","bank","',"," maybe"," '","words","'.\n\n","We"," can"," also"," note"," more"," sophisticated",":"," use"," spa","Cy"," with"," part","-of","-s","peech"," tag"," '","INT","J","'"," for"," inter","jections",".\n\n","The"," code",":"," read"," file",","," strip"," newline",","," tokenize"," sentences",","," then"," tokens","."," For"," each"," token",","," if"," tag"," indicates"," inter","jection",","," place"," suffix"," before"," token","."," Eg",":"," \"","Wow","!"," You"," did"," it",".\""," ->"," output",":"," \","," [{","(","Inter","jection",")}","]","Wow","!"," You"," did"," it",".\""," Wait",","," suffix"," before"," them","."," So"," \"","Wow","\""," preceded"," by"," \"[","{","(","Inter","jection",")}","]","\"."," Actually"," requirement",":"," suffix"," before"," them",":"," Let's"," interpret",":"," \"","by"," placing"," a"," \"[","{","(","Inter","jection",")}","]\""," suffix"," before"," them"," in"," an"," output"," file","\"."," In"," text"," that"," means"," preceding"," the"," inter","jection"," word","."," So"," output",":"," \"[","{","(","Inter","jection",")}","]"," Wow","\"\n\n","So"," code",":"," in"," tokens",","," for"," each"," inter","jection"," token",","," produce"," \"[","{","(","Inter","jection",")}","]"," \""," +"," token","."," Then"," join"," to"," output","."," Or"," produce"," whole"," text","."," Also"," newline"," and"," punctuation","."," Use"," token","ization"," accordingly",".\n\n","Will"," provide"," code"," that"," uses"," spa","Cy",":\n\n","``","`\n","import"," sp","acy","\n\n","nl","p"," ="," sp","acy",".load","(\"","en","_core","_web","_sm","\")\n","with"," open","(in","file",","," '","r","',"," encoding","='","utf","8","')"," as"," f",","," open","(outfile",","," '","w","',"," encoding","='","utf","8","')"," as"," out",":\n"," "," doc"," ="," n","lp","(f",".read","())\n"," "," out",".write","('","'.","join","(f","'","[{"," \"(","Inter","jection",")\""," }]"," '"," if"," token",".pos","_"," =="," \"","INT","J","\""," else"," token",".text"," if"," not"," token",".is","_space"," else"," '"," '"," for"," token"," in"," doc","))\n","``","`\n\n","But"," careful",":"," token",".text"," will"," include"," punctuation","."," Build"," output"," string",":"," iterate"," doc",","," for"," each"," token",","," if"," it's"," inter","jection"," and"," not"," punctuation",","," add"," prefix","."," But"," token",".is","_p","unct"," remains"," part"," of"," original",","," do"," not"," modify","."," But"," we"," want"," to"," keep"," spacing","."," Might"," use"," token",".wh","itespace","_"," attribute",".\n\n","Simpl","er",":"," iterate"," tokens",","," build"," string",","," each"," token",":\n\n","``","`\n","if"," token",".pos","_"," =="," \"","INT","J","\":\n"," "," out",".write","(\"[","{","(","Inter","jection",")}","]"," \")\n","output","_text"," +="," token",".text"," +"," token",".wh","itespace","_\n","``","`\n\n","Spa","Cy","'s"," token",".wh","itespace","_"," prints"," trailing"," whitespace",".\n\n","Alternatively"," use"," N","LT","K"," tag",":"," simpler"," to"," maintain"," lex","icon","."," But"," spa","Cy"," is"," robust",".\n\n","We"," can"," include"," both"," options",":"," with"," N","LT","K"," which"," uses"," tag"," '","UH","',"," and"," with"," spa","Cy","."," Provide"," code"," to"," read"," file"," and"," output"," processed","."," Provide"," explanation","."," Also"," mention"," possibility"," to"," detect"," inter","jections"," by"," maintaining"," a"," list",".\n\n","We"," can"," present"," code",".\n\n","Also"," can"," highlight"," with"," python","."," Provide"," typical"," usage",":"," my","script",".py"," input",".txt"," output",".txt","\n\n","Also"," mention"," if"," wanting"," to"," ignore"," capital","ized"," inter","jections"," at"," beginning"," of"," sentence",":"," but"," may"," be"," part"," of"," proper"," nouns","."," But"," sp","acy"," will"," treat"," \"","I","\""," as"," PR","ON"," not"," INT","J",".\n\n","Ok","."," Let's"," produce"," final"," answer"," with"," code",".","<|end|>","<|start|>","assistant","<|channel|>","final","<|message|>","Absolutely","—","Python"," makes"," this"," a"," one","‑","liner"," from"," an"," engineering"," point"," of"," view","."," \n","Below"," are"," **","two"," complete",","," ready","‑","to","‑","run"," examples","**"," that"," read"," a"," plain","‐","text"," file",",\n","spot"," every"," inter","jection",","," prepend"," the"," marker"," `","[{","(","Inter","jection",")}","]","`"," in"," front"," of"," it",",\n","and"," write"," the"," transformed"," text"," to"," a"," new"," file",".\n\n","*","The"," two"," approaches"," are",":","*\n\n","1","."," **","Spa","Cy","**"," –"," uses"," a"," statistical"," POS"," tag","ger"," (`","INT","J","`"," ="," “","Inter","jection","”)."," \n","2","."," **","NL","TK","**"," –"," uses"," the"," classic"," Penn"," Tree","bank"," tag"," `","UH","`"," (","inter","jection",")"," and"," a"," small","\n"," "," hand","‑","crafted"," list"," of"," common"," inter","jections",".\n\n","Choose"," the"," one"," that"," best"," suits"," your"," setup",";"," both"," are"," safe"," to"," drop"," into"," any","\n","Python"," ","3",".","10","+"," script"," or"," J","upyter"," notebook",".\n\n","---\n\n","##"," ","1","."," Spa","Cy"," version"," "," (","recommended"," for"," production",")\n\n","###"," Install"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Chat","maxValue":309.75,"maxValueTokenIndex":504,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,72.9375,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,49.25,33.5,0,0,69.75,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,34.21875,0,81.875,0,0,0,0,0,0,0,0,115.875,0,132.75,167.5,212.375,60.5,72.5625,103,106.3125,82.125,0,0,53.5,132.5,0,78.5625,100.5,132.5,31.625,44.96875,56.34375,48.34375,106,0,63.65625,0,0,0,0,0,0,0,0,66.9375,200.625,78.25,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,36.65625,180.875,24.90625,0,38.1875,0,0,238.125,29.546875,0,125.5625,58.15625,0,143.75,238.75,206.25,43.75,309.75,88.875,226.75,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,107.625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,104.875,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,138.125,28.140625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,121.125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,100.0625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,28.375,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,41.625,169.375,0,24.203125,40.46875,56.375,70.25,0,0,68.8125,64.0625,0,0,0,0,0,0,0,0,0,0,0,0,0,50.84375,0,0,0,0,0,28.3125,0,28.953125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,184.625,0,0,0,0,56.28125,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"fc395gplo6ncvzd7xqjpg8tp","tokens":["<|start|>","system","<|message|>","You"," are"," Chat","GPT",","," a"," large"," language"," model"," trained"," by"," Open","AI",".\n","Knowledge"," cutoff",":"," ","202","4","-","06","\n","Current"," date",":"," ","202","5","-","09","-","18","\n\n","Reason","ing",":"," low","\n\n","#"," Valid"," channels",":"," analysis",","," commentary",","," final","."," Channel"," must"," be"," included"," for"," every"," message",".","<|end|>","<|start|>","user","<|message|>","Provide"," a"," comprehensive"," description"," of"," a"," real","-life"," scenario"," where"," machine"," learning"," has"," been"," successfully"," implemented"," for"," improving"," natural"," language"," processing","."," Include"," specific"," details"," such"," as"," the"," type"," of"," data"," used",","," the"," machine"," learning"," models"," applied",","," the"," challenges"," faced",","," and"," the"," outcomes"," achieved",".","<|end|>","<|start|>","assistant","<|channel|>","analysis","<|message|>","Need"," detailed"," case"," study",".","<|end|>","<|start|>","assistant","<|channel|>","final","<|message|>","###"," Real","‑","Life"," Scenario",":"," Convers","ational"," AI"," for"," Healthcare"," Appointment"," Scheduling"," \n","*","Institute",":*"," University"," of"," Washington"," ","—"," ","Department"," of"," Biomedical"," Informat","ics"," \n","*","Project",":*"," **","C","aring","Bot","**"," –"," an"," AI"," assistant"," that"," interpre","ts"," patient"," voice"," and"," text"," messages"," and"," schedules"," appointments"," with"," primary","‑","care"," physicians","."," \n\n","---\n\n","##"," ","1","."," Problem"," Statement","\n\n","-"," **","Clinical"," Pain"," Point","**",":"," Over"," ","30"," ","%"," of"," primary","‑","care"," visits"," were"," booked"," via"," telephone"," call",","," causing"," long"," waiting"," times",","," provider"," frustration",","," and"," scheduling"," errors","."," \n","-"," **","Goal","**",":"," Reduce"," call"," volume"," by"," ","50"," ","%"," and"," average"," booking"," time"," from"," ","12"," ","min"," to"," ≤","2"," ","min"," while"," maintaining"," high"," accuracy"," (","≥","97"," ","%"," correct"," intent"," detection",").\n\n","---\n\n","##"," ","2","."," Data"," Collection"," &"," Preparation"," \n\n","|"," Data"," Type"," |"," Source"," |"," Volume"," (","Sept"," ","202","3","‑","Feb"," ","202","4",")"," |"," Key"," Features"," |\n","|","-----------","|","--------","|","----------------","------------","|","--------------","|\n","|"," **","Text","**"," |"," Logged"," ","1",".","2"," ","M"," patient"," messages"," received"," via"," secure"," portal"," (","patient"," portal",","," email",","," and"," SMS",")."," |"," ","1"," ","million"," messages"," |"," “","Schedule"," flu"," shot","”,"," “","Need"," to"," postpone"," appointment","”,"," “","When"," is"," my"," next"," check","‑","up","?”"," |\n","|"," **","Speech","**"," |"," ","50",",","000"," spoken"," requests"," from"," call"," center"," (","man","ually"," archived",","," anonym","ized",")."," |"," ","50"," ","k"," audio"," files"," |"," ","1","–","3"," ","min",","," ","16"," ","k","Hz",","," ~","30"," ","k"," transcripts"," |\n","|"," **","Metadata","**"," |"," Appointment"," history",","," patient"," demographics"," (","age",","," gender",","," insurance"," type","),"," provider"," availability"," schedule","."," |"," ","200"," ","k"," rows"," |"," Time"," slots",","," patient"," no","‑","show"," propensity"," scores"," |\n\n","###"," Annotation"," Workflow"," \n\n","1","."," **","Int","ents","**",":"," ","12"," intents"," (","Schedule",","," Res","chedule",","," Cancel",","," Request"," Information",","," Insurance",","," etc",".)."," \n","2","."," **","Entities","**",":"," Date","/","Time",","," Reason"," for"," visit",","," Physician"," ID",","," Insurance"," plan","."," \n","3","."," **","Annot","ators","**",":"," Mixed"," team"," of"," ","30"," trained"," nurses"," +"," ","10"," data"," scientists","."," \n","4","."," **","Tools","**",":"," Pro","dig","y"," +"," custom"," annotation"," platform",","," with"," active"," learning"," loop","."," \n","5","."," **","Quality"," Control","**",":"," Inter","‑","annot","ator"," agreement"," (","C","ohen","’s"," κ",")"," >"," ","0",".","86"," across"," all"," intents",".\n\n","---\n\n","##"," ","3","."," Modeling"," Stack"," \n\n","|"," Stage"," |"," Model","(s",")"," |"," Reason","ing"," |"," Implementation"," Details"," |\n","|","-------","|","----------","|","-----------","|","----------------","--------","|\n","|"," **","Speech","‑","to","‑","Text"," (","ST","T",")**"," |"," **","Kal","di","**"," with"," a"," fine","‑","t","uned"," **","wav","2","vec"," ","2",".","0","**"," encoder"," (","pre","‑","trained"," on"," ","500"," ","h"," medical"," corpus",")"," |"," Domain","‑","specific"," acoustic"," model"," reduces"," O","OV"," for"," medical"," terms"," |"," Beam"," search"," width"," ","20",","," resc","oring"," with"," a"," ","5","‑","gram"," LM"," |\n","|"," **","Text"," Input","**"," |"," **","B","ERT","‑","based","**"," models"," (","domain","‑","specific",")"," |"," Superior"," contextual"," embeddings"," for"," short"," medical"," utter","ances"," |"," Ru","GPT","‑","3"," (","Medical",")"," –"," ","350","M"," params",","," fine","‑","t","uned"," on"," ","1"," ","M"," messages"," |\n","|"," **","Intent"," Classification","**"," |"," **","Fast","Text","**"," (","word","‑","embedding"," bag","‑","of","‑","words",")"," +"," **","Conditional"," Random"," Fields"," (","CR","F",")**"," |"," Fast"," inference"," (","≤","5"," ","ms",")"," &"," handles"," out","‑","of","‑","v","ocabulary"," words"," with"," sub","‑","token"," features"," |"," Ensemble"," with"," B","ERT"," →"," majority"," voting"," |\n","|"," **","Entity"," Extraction","**"," |"," **","spa","Cy","**"," transformer"," pipeline"," (","en","‑","core","\\","_","md",")"," +"," NL","Me","ch"," for"," nested"," entities"," |"," Handles"," multi","‑","word"," expressions"," &"," human","‑","read","able"," constraints"," |"," Word","‑","piece"," token"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Chat","maxValue":300.5,"maxValueTokenIndex":808,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,32.46875,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,71.875,208.25,35.4375,46.21875,119.5625,67.8125,86.3125,109,300.5,107.875,235,168,64.0625,0,0,0,32.96875,24.328125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"rg737irj0mfzwva5wyvb6nak","tokens":["<|startoftext|>","In"," my"," role"," as"," European"," Studies"," Lia","ison",","," one"," of"," my"," priorities"," is"," to"," assist"," people"," in"," their"," digital"," humanities"," work","."," In"," that"," work",","," I"," have"," found"," a"," glaring"," gap"," in"," tools"," that"," support"," multilingual"," and"," non","-English"," materials",","," particularly"," those"," that"," focus"," on"," natural"," language"," processing"," (","N","LP",")."," Much"," of"," the"," work"," that"," has"," been"," done"," using"," NLP"," has"," been"," focused"," on"," an"," Ang","loc","entric"," model",","," using"," English"," texts"," in"," conjunction"," with"," tools"," and"," computer"," models"," that"," are"," primarily"," designed"," to"," work"," with"," the"," English"," language","."," I"," wanted"," to"," make"," it"," easier"," for"," people"," to"," begin"," engaging"," with"," non","-English"," materials"," within"," the"," context"," of"," their"," NLP"," and"," digital"," humanities"," work",","," so"," I"," created"," Roz","ha",".\n","Roz","ha",","," a"," Python"," package"," designed"," to"," simplify"," multilingual"," natural"," language"," processing"," (","N","LP",")"," processes"," and"," pipelines",","," was"," recently"," released"," on"," Git","Hub"," and"," Py","PI"," under"," the"," GNU"," General"," Public"," License",","," allowing"," users"," to"," use"," and"," contribute"," to"," the"," tool"," with"," minimal"," limitations","."," The"," package"," includes"," functions"," to"," perform"," a"," wide"," variety"," of"," NLP"," processes"," using"," over"," ","70"," languages",","," from"," stop","word"," removal"," to"," sentiment"," analysis"," and"," many"," more",","," in"," addition"," to"," visual","izations"," of"," the"," analyzed"," texts","."," It"," also"," allows"," users"," to"," choose"," from"," N","LT","K",","," spa","Cy",","," and"," St","anza"," for"," many"," of"," the"," processes"," it"," can"," perform",","," allowing"," for"," easy"," comparison"," of"," the"," output"," from"," each"," library","."," Examples"," of"," the"," code"," being"," used"," can"," be"," seen"," here",".\n","While"," the"," project"," first"," grew"," out"," of"," the"," needs"," of"," researchers"," and"," graduate"," students"," working"," at"," UT","-A","ustin"," who"," were"," interested"," in"," exploring"," NLP"," and"," the"," digital"," humanities"," using"," non","-English"," languages"," but"," who"," did"," not"," have"," very"," much"," prior"," coding"," experience",","," its"," code"," also"," aims"," to"," streamline"," NLP"," work"," for"," those"," with"," more"," technical"," knowledge"," by"," simplifying"," and"," shortening"," the"," amount"," of"," code"," they"," need"," to"," write"," to"," accomplish"," tasks","."," Output"," from"," the"," package","’s"," functions"," can"," be"," integrated"," into"," more"," complex"," and"," nuanced"," workflows",","," allowing"," users"," to"," use"," the"," tool"," to"," perform"," standard"," tasks"," like"," word"," token","ization"," and"," then"," use"," the"," response"," for"," their"," other"," work",".\n","The"," package"," is"," written"," in"," Python"," for"," a"," variety"," of"," reasons","."," Python"," has"," a"," wide"," base"," of"," users"," that"," makes"," it"," easy"," to"," share"," with"," others",","," and"," which"," helps"," ensure"," that"," it"," will"," be"," used"," widely","."," It"," also"," helps"," ensure"," that"," people"," will"," contribute"," to"," the"," project",","," building"," upon"," its"," existing"," code","."," F","ost","ering"," contributions"," for"," multilingual"," digital"," humanities"," and"," NLP"," can"," help"," broaden"," the"," community"," of"," scholars",","," cod","ers"," and"," researchers"," working"," with"," these"," multilingual"," materials",","," which"," will"," broaden"," the"," community"," in"," general"," while"," also"," improving"," the"," package","."," Python"," is"," also"," very"," commonly"," used"," for"," NLP"," applications",","," and"," the"," packages"," integrated"," into"," Roz","ha"," all"," have"," robust"," communities"," of"," their"," own","."," This"," allows"," for"," users"," to"," connect"," with"," other"," communities"," as"," well",","," and"," to"," explore"," these"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Non-Chat","maxValue":239.875,"maxValueTokenIndex":230,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,23.265625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,39.1875,106.5625,0,116.1875,239.875,31.015625,0,41.40625,130.5,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,55.1875,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,37.28125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"nb6z13t9gp3fafnuee058j32","tokens":["<|startoftext|>","On"," April"," ","23",","," ","201","8",","," Google"," announced"," the"," open","-source"," projects"," that"," will"," participate"," in"," Google"," Summer"," Of"," Code"," ","201","8","."," GF","OSS"," participates"," this"," year"," with"," ","10"," open"," source"," projects",","," and"," students"," who"," will"," successfully"," complete"," the"," program"," will"," be"," rewarded"," with"," stip","ends"," for"," their"," contributions",".\n","G","So","C"," offers"," students"," from"," around"," the"," world"," the"," opportunity"," to"," contribute"," to"," a"," software"," project",","," and"," to"," learn"," how"," to"," work"," in"," an"," open"," source"," software"," development"," environment","."," Every"," summer",","," thousands"," of"," students"," from"," around"," the"," world"," participate"," in"," the"," G","So","C",","," contributing"," to"," the"," development"," of"," open"," source"," projects",".\n","The"," ","10"," open","-source"," projects"," to"," be"," developed"," within"," GS","OC"," ","201","8"," are",":\n","-"," Adding"," Greek"," language"," on"," NLP"," library"," Sp","acy",".io","\n","Sp","acy"," is"," an"," open","-source"," Python"," library"," for"," advanced"," Natural"," Language"," Processing","."," Adding"," the"," Greek"," language"," will"," provide"," massive"," improvements"," on"," applying"," NLP"," on"," the"," Greek"," language",","," and"," allow"," for"," actions"," as"," Named"," entity"," recognition"," and"," Part","-of","-s","peech"," tagging","\n","The"," objective"," of"," this"," project"," is"," to"," extend"," existing"," Government"," Gazette","(G","G",")"," text"," mining"," code"," with"," Named"," Entity"," Recognition"," features"," that"," will"," allow"," the"," identification"," of"," Government"," Director","ates"," and"," Div","isions"," with"," the"," responsibilities"," assigned"," to"," them"," and"," the"," types"," of"," services"," they"," are"," required"," to"," provide"," according"," with"," their"," legal"," framework"," published"," in"," http","://","www",".et",".gr","/"," and"," the"," extraction"," of"," this"," information"," with"," related"," metadata"," (","decision"," number",","," date"," of"," the"," GG"," issue",").\n","E","pop","tes"," (","Ε","πό","π","της"," –"," a"," Greek"," word"," for"," overse","er",")"," is"," an"," open"," source"," computer"," lab"," management"," and"," monitoring"," tool","."," It"," allows"," for"," screen"," broadcasting"," and"," monitoring",","," remote"," command"," execution",","," message"," sending",","," imposing"," restrictions"," like"," screen"," locking"," or"," sound"," mut","ing"," the"," clients"," and"," much"," more","."," The"," objective"," of"," thi","w"," project"," is"," to"," rewrite"," E","pop","tes"," with"," Python"," ","3"," and"," Gtk","3"," with"," G","Object"," Int","rospection"," support","\n","The"," objective"," of"," this"," project"," is"," to"," extend"," existing"," Government"," Gazette"," text"," mining"," code"," to"," cross","-link"," legal"," texts"," and"," detect"," the"," ministers"," that"," sign"," them",".\n","Libre","Office"," customization"," in"," order"," to"," achieve"," a"," “","f","amiliar","”"," look"," and"," menus"," for"," users"," that"," convert"," from"," MS"," Office"," ","201","3",","," and"," creation"," of"," specific"," templates"," for"," the"," Greek"," Legal"," system",".\n","A"," web","-based"," system"," to"," manage"," data"," on"," software"," components"," and"," their"," relations","."," Ment","ors",":"," Alex","ios"," Z","avras"," Georgia"," Kap","its","aki","\n","WS","O","2"," Identity"," Server"," provides"," secure"," identity"," management"," for"," enterprise"," web"," applications",","," services",","," and"," APIs"," by"," managing"," identity"," and"," ent","itlements"," of"," the"," users"," securely"," and"," efficiently",".\n","The"," aim"," of"," this"," project"," is"," to"," create"," a"," new"," type"," of"," user","store"," where"," credentials"," will"," be"," se","pare","ted"," from"," attir","b","utes"," and"," attributes"," (","claims",")"," will"," be"," able"," to"," be"," configured"," from"," the"," web"," UI"," as"," a"," SOAP"," or"," REST"," web"," service",".\n","A"," collection"," of"," tools"," supporting"," penetration"," test","\n","-"," Addition"," of"," Greek"," glyph","s"," in"," the"," Open"," Source"," Fonts"," Ar","ima","Mad","urai","\n","-"," Addition"," of"," Greek"," glyph","s"," in"," the"," Open"," Source"," Fonts"," Work","Sans"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Non-Chat","maxValue":137.75,"maxValueTokenIndex":141,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,137.75,0,0,0,113.4375,0,0,0,0,0,52.8125,0,69.375,0,0,50.90625,0,0,0,0,121.1875,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,25.203125],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"ivlwmuycujiy23bmpt5jwh9z","tokens":["<|startoftext|>","cu","atro",".","3","."," The"," latest"," fantasy"," running"," device","\n","Next",","," i"," establish"," the"," tool"," pre","-process"," for"," each"," and"," every"," dream"," statement"," (§","4",".","3",".","1","),"," then"," describes"," emails"," (§","4",".step"," ","3",".d","os",","," §","4",".step"," three",".","3","),"," societal"," affairs"," (§","cu","atro",".step"," three",".","4",")"," and"," you"," will"," emotion"," terms"," and"," conditions"," (§","4",".","3",".","5",")."," We"," decided"," to"," focus"," on"," these"," types"," of"," three"," dimensions"," out","-of"," the"," the"," ones"," as"," part"," of"," the"," Hall","way","–","Van"," de"," Palace"," programming"," program"," for"," a"," few"," grounds","."," First"," and"," foremost",","," this"," type"," of"," three"," size"," is"," said"," to"," be"," the"," initial"," of"," those"," in"," assisting"," the"," translation"," of"," fantasies",","," while"," they"," explain"," the"," fresh"," new"," spine"," off"," an"," aspiration"," patch"," :"," who"," had"," been"," present",","," and"," this"," methods"," was"," indeed"," did"," and"," which"," thoughts"," was"," in"," fact"," shown","."," Speaking"," of",","," indeed",","," the"," ","3"," proportions"," you"," to"," old","-fashioned"," small","-me","asure"," degree"," with"," the"," dream"," profile"," generally"," concerned"," about"," [","68","–","70","]."," ","2","nd",","," some"," of"," the"," leftover"," dimensions"," (","age",".g","."," profits"," and"," failure",","," luck"," and"," you"," will"," bad"," luck",")"," portray"," very"," contextual"," and"," you"," can"," possibly"," not"," clear"," basics"," that"," will"," be"," already"," tough"," to"," determine"," that"," have"," state","-of","-the","-art","work"," natural"," words"," running"," (","N","LP",")"," process",","," therefore"," we"," will"," recommend"," research"," into"," the"," heightened"," NLP"," gadgets"," because"," section"," of"," future"," functions",".\n","Contour"," dos","."," Application"," of"," the"," equipment"," in"," order"," to"," an"," illustration"," dream"," statement","."," The"," newest"," fantasy"," report"," comes"," from"," Dream","bank"," (§","4",".d","os",".","1",")."," The"," fresh"," new"," tool"," parses"," it"," because"," they"," build"," a"," tree"," of"," verbs"," (","V","BD",")"," and"," you"," may"," nouns"," (","NN",","," N","NP",")"," (§","4",".","3",".","1",")."," By"," using"," the"," a"," couple"," exterior"," degree"," angles",","," the"," latest"," device"," identifies"," someone",","," creature"," and"," you"," can"," imaginary"," emails"," one"," of"," many"," nouns"," (§","cu","atro",".","3",".","2",");"," class","ifies"," emails"," in"," terms"," of"," the"," sex",","," chat","spin"," ben","zeri"," uygul","amalar"," if"," they"," is"," actually"," dry",","," and"," you"," can"," if"," they"," is"," fictional"," (§","4",".step"," ","3",".","3",");"," makes"," reference"," to"," verbs"," you"," to"," show"," amic","able",","," competitive"," and"," you"," can"," intimate"," relations"," (§","cu","atro",".step"," three",".","4",");"," determines"," if"," or"," not"," each"," verb"," shows"," a"," relationships"," or"," otherwise"," not"," pred","icated"," on"," perhaps"," the"," two"," actors"," regarding"," verb"," (","this"," new"," noun"," preceding"," new"," verb"," and"," therefore"," following"," they",")"," was"," recognizable",";"," and"," you"," may"," identifies"," negative"," and"," positive"," feeling"," terminology"," having"," fun"," with"," Em","ole","x"," (§","cu","atro",".step"," three",".","5",").\n","cu","atro",".step"," three",".","1","."," Pre","processing","\n","Brand"," new"," equipment"," initial"," develops"," most"," of"," the"," most"," typical"," English"," contractions"," ","1"," (","el","izabeth",".g","."," ‘","I","’m","’"," to"," help"," you"," ‘","I"," am","’)"," that"," are"," found"," in"," the"," first"," fantasy"," declaration","."," That"," is"," completed"," to"," convenience"," the"," latest"," identity"," out"," of"," nouns"," and"," you"," may"," verbs","."," The"," equipment"," doesn","’t"," cure"," one"," stop","-","phrase"," or"," punctuation"," never"," to"," affect"," the"," after"," the"," step"," off"," synt","actical"," parsing",".\n","For"," the"," resulting"," text",","," the"," fresh"," new"," tool"," applies"," constituent","-founded"," investigation"," ,"," a"," strategy"," regularly"," fal","ter"," natural"," language"," text"," on"," the"," component"," parts"," which"," can"," up"," coming"," getting"," later"," on"," analysed"," on"," their"," own","."," Constitu","ents"," are"," categories"," of"," conditions"," operating"," because"," defined"," devices"," and"," therefore"," belong"," sometimes"," to"," ph","ras","al"," groups"," (","el","izabeth",".g","."," noun"," sentences",","," verb"," sentences",")"," or"," even"," to"," lexical"," groups"," (","el","izabeth",".g","."," nouns",","," verbs",","," adjectives",","," conjunction","s",","," ad","verbs",")."," Constitu","ents"," try"," iter","atively"," divided"," into"," sub","const","itu","ents",","," as"," a"," result"," of"," the"," level"," of"," private"," words","."," The"," consequence"," of"," this"," method"," try"," an"," excellent"," parse"," tree",","," specifically"," an"," effective"," dend","rogram"," whoever"," means"," is"," the"," very"," first"," phrase",","," sides"," are"," creation"," laws"," you"," to"," mirror"," the"," dwelling"," of"," your"," English"," grammar"," (","el","izabeth",".","grams","."," an"," entire"," sentence"," is"," broke"," up"," depending"," on"," the"," topic","–","predicate"," office","),"," nodes"," is"," constituents"," and"," you"," can"," sub","-","const","itu","ents",","," and"," you"," can"," simply"," leaves"," are"," personal"," words",".\n","Among"," most"," of"," the"," in"," public"," places"," available"," methods"," for"," constituent","-dependent"," research",","," all"," of"," our"," product"," incorporates"," the"," fresh"," Stanford","Parser"," on"," nltk"," python"," toolkit"," ,"," a"," commonly"," used"," condition","-of","-the","-","ways"," parser"," based"," on"," probabil","istic"," context","-t","ot","ally"," free"," gramm","ars"," ."," This"," new"," equipment"," outputs"," the"," parse"," tree"," and"," you"," may"," annot","ates"," nodes"," and"," you"," will"," actually"," leaves"," due"," to"," their"," involved"," lexical"," otherwise"," ph","ras","al"," classification"," (","ideal"," from"," contour"," ","2",").\n","After"," building"," the"," latest"," tree",","," by"," then"," applying"," the"," morphological"," setting"," mor","phy"," within"," the"," nltk",","," the"," fresh"," new"," equipment"," converts"," most"," of"," the"," words"," included"," in"," the"," tree","’s"," actually"," leaves"," for"," the"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Non-Chat","maxValue":86,"maxValueTokenIndex":779,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,86,57.65625,0,49.96875,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,40.9375,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"u2bw3sx7m35c6130nkk417xe","tokens":["<|startoftext|>","A"," construction"," can"," be"," defined"," as"," a"," form","-","meaning"," pairing"," in"," which"," the"," components"," cannot"," entirely"," explain"," the"," meaning"," of"," the"," whole","."," Construction","al"," phenomena"," range"," from"," mor","phe","mes"," to"," argument"," structure",","," and"," include"," obvious"," examples"," like"," coll","ocations"," (\"","her","met","ically"," sealed","\"),"," (","idi","omatic",")"," expressions"," with"," fixed"," constituents"," (\"","kick"," the"," bucket","\"),"," expressions"," with"," (","semi","-)","optional"," constituents"," (\"","hun","gry"," as"," a"," X","\"),"," and"," sequences"," of"," grammatical"," categories"," ([","det","][","adj","][","noun","]),"," as"," well"," as"," more"," complex"," constructions"," involving",","," e",".g",".,"," the"," occurrence"," of"," sentence"," composition"," features"," (","e",".g","."," trans","itivity",")"," or"," ad","verb","ial"," types"," (","e",".g","."," spatial"," ad","verb","ials",")."," As"," these"," examples"," demonstrate",","," constructions"," are"," a"," diverse"," breed",","," and"," construction","ist"," theories"," do"," not"," give"," a"," government"," to"," any"," specific"," level"," of"," language","."," On"," the"," contrary",","," all"," levels"," are"," viewed"," as"," equally"," important",".\n","Con","structions"," are"," currently"," enjoying"," considerable"," attention"," in"," linguistic"," research",","," and"," are"," now"," widely"," considered"," as"," being"," much"," more"," frequent"," and"," central"," to"," language"," than"," what"," has"," traditionally"," been"," acknowledged","."," Construction","ist"," theories"," emphasize"," that"," the"," human"," mind"," seems"," to"," prefer"," to"," use"," pref","abric","ated"," chunks"," of"," linguistic"," elements"," (","i",".e","."," constructions",")"," when"," possible",","," instead"," of"," generating"," sentences"," from"," scratch"," as"," in"," the"," gener","ative"," grammar"," approach","."," Con","structions"," are"," also"," gaining"," a"," central"," place"," in"," different"," kinds"," of"," computational"," lingu","istics"," applications",";"," examples"," include"," machine"," translation",","," information"," retrieval"," and"," extraction",","," tools"," for"," language"," learning",","," etc","."," Con","structions"," are"," an"," interesting"," and"," important"," phenomenon"," because"," they"," constitute"," a"," middle","way"," in"," the"," syntax","-","lex","icon"," continuum",","," and"," because"," they"," show"," great"," potential"," in"," tackling"," inf","am","ously"," difficult"," computational"," lingu","istics"," tasks"," like"," sentiment"," analysis"," and"," language"," acquisition",".\n","This"," workshop"," will"," encourage"," submissions"," in"," all"," aspects"," of"," constructions","-based"," research",","," including",":\n","The","oretical"," discussions"," on"," the"," nature"," and"," place"," within"," (","comput","ational",")"," linguistic"," theory"," of"," the"," concept"," of"," linguistic"," constructions",".\n","Methods"," and"," algorithms"," for"," identifying"," and"," extracting"," linguistic"," constructions"," (","coll","ocations",","," idi","oms",","," multi","word"," expressions",","," grammatical"," constructions",","," etc",".).\n","Uses"," and"," applications"," of"," linguistic"," constructions"," (","machine"," translation",","," information"," access",","," sentiment"," analysis",","," tools"," for"," language"," learning"," etc",".).\n","Submission"," deadline",":"," March"," ","1",","," ","201","0","\n","Notification"," of"," acceptance",":"," March"," ","30",","," ","201","0","\n","Camera"," ready"," papers",":"," April"," ","12",","," ","201","0","\n","Workshop",":"," June"," ","6",","," ","201","0","\n","NA","ACL"," H","LT"," ","201","0",","," Los"," Angeles",","," USA",".\n","We"," invite"," authors"," to"," submit"," papers"," via",":"," https","://","www",".soft","conf",".com","/","na","ac","lh","lt","201","0","/con","structions","/."," Sub","missions"," should"," be"," blind",","," avoid"," references"," to"," unpublished"," papers",","," not"," exceed"," ","8"," pages"," (","including"," references","),"," and"," should"," use"," the"," NA","ACL"," H","LT"," ","201","0"," style"," files",","," available"," at",":"," http","://","na","ac","lh","lt","201","0",".is","i",".edu","/auth","ors",".html","."," Each"," submission"," will"," be"," reviewed"," by"," two"," members"," of"," the"," program"," committee",".\n","Magn","us"," S","ahl","gren",","," S","ICS"," (","firstname",".lastname","@example",".org",")\n","O","la"," Kn","ut","sson",","," K","TH"," (","email","@example",".com",")\n","Benjamin"," Bergen",","," University"," of"," Hawaii",","," USA","\n","James"," Curr","an",","," University"," of"," Sydney",","," Australia","\n","Ste","fan"," E","vert",","," University"," of"," Os","n","abr","ück",","," Germany","\n","Charles"," Fill","more",","," University"," of"," Berkeley",","," USA","\n","Jonathan"," G","inz","burg",","," King's"," College",","," UK","\n","A","dele"," Goldberg",","," Princeton"," University",","," USA","\n","Ste","fan"," Th","."," Gr","ies",","," University"," of"," California",","," USA","\n","Matthew"," H","onn","ibal",","," University"," of"," Sydney",","," Australia","\n","J","ussi"," Karl","gren",","," Swedish"," Institute"," of"," Computer"," Science",","," Sweden"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Non-Chat","maxValue":84.25,"maxValueTokenIndex":657,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,84.25,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"i8ojaf5fi4a0dwv4cmwff64m","tokens":["<|startoftext|>","alph","asp","irit"," -"," Fot","olia","\n","Who"," grows"," up"," dreaming"," they'll"," be"," in"," charge"," of"," user","-generated"," content"," (","UG","C",")"," for"," a"," large"," retailer","?"," Not"," Matt"," Fisher",","," with"," an"," undergraduate"," degree"," in"," marketing"," and"," an"," interest"," in"," law","."," But"," the"," program"," manager"," for"," product"," reviews"," and"," ratings"," at"," Nord","strom"," Inc","."," recalls"," \"","fall","ing"," in"," love"," with"," data","\""," while"," working"," for"," Microsoft"," and"," Amazon","."," A"," year"," ago",","," he"," joined"," Nord","strom","'s"," product"," management"," and"," development"," organization",","," and"," is"," currently"," in"," charge"," of"," user","-generated"," content"," created"," on"," Nord","strom"," websites",".\n","\"","Anywhere"," our"," customers"," can"," leave"," a"," comment",","," upload"," a"," photo",","," ask"," a"," question",","," or"," find"," an"," answer"," to"," an"," already"," asked"," question"," is"," tagged"," as"," user","-generated"," content",",\""," Fisher"," said",".\n","The"," role"," isn't"," new",","," exactly"," --"," it's"," been"," around"," since"," ","200","9"," --"," but"," in"," the"," last"," year",","," it's"," gone"," from"," being"," part"," of"," Nord","strom","'s"," \"","voice"," of"," the"," customer","\""," team"," to"," a"," separate"," entity",","," said"," Fisher",","," who"," is"," slated"," to"," give"," a"," presentation"," at"," the"," Text"," Analytics"," Summit"," West"," this"," fall",".\n","In"," this"," Search","C","IO"," Business"," POV"," interview",","," Senior"," News"," Writer"," Nicole"," L","ask","owski"," sat"," down"," with"," Fisher"," to"," discuss"," the"," technology"," he's"," using"," --"," including"," Hadoop"," --"," to"," parse"," through"," tens"," of"," thousands"," of"," customer"," reviews","."," One"," lesson"," learned"," from"," mining"," user","-generated"," content","?"," Don't"," take"," five","-star"," customer"," product"," reviews"," at"," face"," value",".\n","You're"," working"," with"," a"," lot"," of"," text"," or"," un","structured"," data","."," What's"," the"," biggest"," hurdle"," for"," you","?\n","Matt"," Fisher",":"," We"," have"," millions"," and"," millions"," of"," rows"," of"," un","structured"," data"," in"," the"," form"," of"," free","-form"," text"," that's"," coming"," in"," from"," different"," areas",":"," It"," could"," be"," customer"," reviews",";"," it"," could"," be"," a"," question",";"," it"," could"," be"," through"," our"," Fore","See"," surveys"," online"," or"," we"," also"," use"," Opinion","Lab"," to"," aggregate"," content"," on"," the"," site",";"," it"," could"," be"," through"," our"," comment"," cards","."," We're"," trying"," to"," tie"," all"," of"," this"," together"," to"," get"," a"," better"," understanding"," of"," what"," our"," customers"," are"," saying"," --"," what"," are"," the"," themes"," and"," trends"," in"," the"," areas"," that"," are"," working"," great"," and"," in"," the"," areas"," that"," aren't"," working"," great",".\n","One"," problem",":"," We"," don't"," have"," an"," enterprise","-wide"," solution"," to"," do"," this","."," So"," trying"," to"," create"," a"," consistent"," and"," pragmatic"," process"," across"," the"," board"," has"," been"," one"," barrier","."," It's"," a"," big"," org",","," we"," have"," lot"," of"," people"," sitting"," in"," different"," teams",","," so"," creating"," consistency"," on"," how"," things"," are"," measured"," has"," been"," a"," problem",".\n","What's"," an"," example"," of"," an"," area"," that"," isn't"," working"," great","?\n","F","isher",":"," One"," specific"," project"," I'm"," working"," on"," is"," to"," better"," identify"," shipping"," issues"," and"," holes"," in"," our"," fulfillment"," process","."," We"," have"," fulfillment"," centers"," in"," the"," United"," States"," with"," one"," primary"," center"," in"," the"," Midwest","."," What"," I've"," been"," doing"," is"," looking"," at"," every"," [","customer","]"," review"," piece"," of"," content"," and"," every"," '","question"," content","'"," that"," comes"," in"," through"," our"," platform","."," We're"," analyzing"," to"," identify"," whether"," it's"," [","related"," to","]"," shipping"," or"," fulfillment"," or"," a"," product","."," We"," have"," specific"," flags"," we"," apply",".\n","Then"," we"," do"," sentiment"," analysis"," to"," determine"," if"," these"," customers"," are"," happy"," or"," upset","."," We"," found"," that",","," although"," some"," of"," our"," customers"," are"," unhappy",","," they're"," typically"," giving"," us"," high"," ratings"," on"," the"," product","."," But"," within"," that"," product"," review",","," they're"," also"," giving"," us"," feedback"," on"," our"," shipping",".\n","So"," we're"," stripping"," the"," product"," review"," out"," and"," we're"," capturing"," the"," fulfillment"," data",","," and"," then"," we're"," able"," to"," share"," that"," with"," our"," partners"," on"," our"," fulfillment"," team"," in"," the"," Midwest"," and"," here"," in"," Seattle","."," We"," can"," say",","," '","There"," seems"," to"," be"," a"," trend"," with"," this"," zip"," code",","," and"," this"," zip"," code"," [","is","]"," getting"," ripped"," boxes",".'"," Or"," with"," this"," division",","," which"," is"," at"," the"," higher"," end"," of"," the"," price"," spectrum",","," the"," customers"," are"," expecting"," a"," nicer"," box"," than"," what"," they're"," getting",".\n","We're"," starting"," to"," uncover"," a"," lot"," of"," these"," trends"," that",","," without"," text"," analytics",","," we"," would"," never"," get"," because"," these"," are"," five","-star"," reviews","."," There's"," nothing"," on"," the"," surface"," that"," would"," seem"," to"," call"," out"," that"," there's"," an"," issue"," or"," a"," problem","."," But"," as"," we"," started"," to"," break"," it"," apart",","," we"," identified"," that"," negative"," sentiment"," can"," be"," included"," within"," those"," reviews",".\n","How"," are"," you"," flag","ging"," content","?"," Is"," that"," done"," manually","?\n","F","isher",":"," Initially",","," we"," did","."," We"," were"," going"," review"," by"," review",","," and"," it"," was"," myself"," and"," another"," colleague"," on"," my"," team","."," Now"," we've"," set"," up"," an"," automated"," process"," where"," basically"," we"," can"," ingest"," a"," large"," set"," of"," data"," into"," a"," Hadoop"," environment"," --"," all"," un","structured"," data"," --"," and"," we"," can"," program","matically"," run"," the"," queries"," we've"," built"," that"," will"," look"," for"," the"," sentiment"," in"," each"," cluster",".\n","We"," utilize"," the"," Stanford"," Natural"," Language"," Processing"," [","N","LP","]"," libraries","."," It's"," a"," free"," tool","set"," for"," NLP"," and"," sentiment"," analysis","."," So"," let's"," say"," it's"," a"," single"," review"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Non-Chat","maxValue":68.1875,"maxValueTokenIndex":853,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,46.53125,0,0,68.1875,0,0,0,0,40.78125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"ytd0n7ggsoxbjue1oib9fja8","tokens":["<|startoftext|>","Part"," ","1",":"," Skip","-","gram"," Feed","forward","\n","Editor's"," Note",":"," This"," post"," is"," part"," of"," a"," series"," based"," on"," the"," research"," conducted"," in"," District"," Data"," Labs","'"," NLP"," Research"," Lab","."," Make"," sure"," to"," check"," out"," the"," other"," posts"," in"," the"," series"," so"," far",":\n","-"," NLP"," Research"," Lab"," Part"," ","1",":"," Distributed"," Represent","ations","\n","-"," NLP"," Research"," Lab"," Part"," ","2",":"," Skip","-Gr","am"," Architecture"," Overview","\n","Let's"," ."," ."," .\n","Editor's"," Note",":"," This"," post"," is"," part"," of"," a"," series"," based"," on"," the"," research"," conducted"," in"," District"," Data"," Labs","'"," NLP"," Research"," Lab","."," Make"," sure"," to"," check"," out"," NLP"," Research"," Lab"," Part"," ","1",":"," Distributed"," Represent","ations",".\n","Ch","ances"," are",","," if"," you","’ve"," been"," working"," in"," Natural"," Language"," Processing"," (","N","LP",")"," or"," machine"," learning",","," you","’ve"," heard"," of"," the"," class"," of"," ."," ."," .\n","How"," I"," Learned"," To"," Stop"," W","orry","ing"," And"," Love"," Word"," Emb","eddings","\n","Editor's"," Note",":"," This"," post"," is"," part"," of"," a"," series"," based"," on"," the"," research"," conducted"," in"," District"," Data"," Labs","'"," NLP"," Research"," Lab",".\n","This"," post"," is"," about"," Distributed"," Represent","ations",","," a"," concept"," that"," is"," foundational"," not"," only"," to"," the"," understanding"," of"," data"," processing"," in"," machine"," learning",","," but"," also"," to"," the"," understanding"," of"," information"," processing"," and"," ."," ."," .\n","Visual","izing"," Text"," with"," Python","\n","In"," this"," article",","," we"," explore"," two"," extremely"," powerful"," ways"," to"," visualize"," text",":"," word"," bubbles"," and"," word"," networks","."," These"," two"," visual","izations"," are"," replacing"," word"," clouds"," as"," the"," def","acto"," text"," visualization"," of"," choice"," because"," they"," are"," simple"," to"," create",","," understandable",","," and"," provide"," deep"," and"," valuable"," at","-a","-gl","ance"," insights","."," In"," this"," post",","," we"," will"," examine"," how"," to"," ."," ."," .\n","Py","Con"," ","201","6"," Tutorial"," on"," Sunday"," May"," ","29",","," ","201","6"," at"," ","9","am","\n","This"," post"," is"," designed"," to"," point"," you"," to"," the"," resources"," that"," you"," need"," in"," order"," to"," prepare"," for"," the"," NLP"," tutorial"," at"," Py","Con"," this"," coming"," weekend","!"," If"," you"," have"," any"," questions",","," please"," contact"," us"," according"," to"," the"," directions"," at"," the"," end"," of"," the"," post",".\n","In"," this"," tutorial",","," we"," will"," explore"," the"," features"," of"," the"," N","LT","K"," library"," for"," text"," processing"," in"," ."," ."," .\n","Sent","iment"," analysis"," is"," a"," common"," application"," of"," Natural"," Language"," Processing"," ("],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Non-Chat","maxValue":65.75,"maxValueTokenIndex":380,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,65.75,23.359375,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"jodwoycngy6iqpvs6sdxxmec","tokens":["<|startoftext|>","Update",":"," I"," finished"," my"," tool"," for"," creating"," a"," customized"," voice"," model","."," It"," encaps","ulates"," the"," best"," of"," what"," I"," described"," below","."," See"," here",":"," https","://","github",".com","/","um","hau","/v","mc",".\n","The"," idea"," with"," a"," limited"," vocabulary"," is"," that"," the"," processor"," can"," deal"," with"," far"," less"," information"," in"," order"," to"," detect"," the"," words"," needed","."," You"," don't"," have"," to"," train"," it"," on"," a"," complete"," set"," of"," words"," in"," the"," English"," language",","," and"," you"," don't"," need"," a"," super","computer","."," All"," you"," have"," to"," do"," is"," teach"," it"," a"," few"," words",","," and"," how"," to"," spell"," them","."," The"," tutorial"," is"," here","."," I've"," created"," a"," script"," to"," automate"," the"," voice"," recording"," here",","," and"," st","ashed"," the"," needed"," files"," there"," with"," it",".\n","Preparation","Alright",","," down"," to"," business","."," You'll"," find"," it"," handy"," to"," keep"," a"," folder"," for"," these"," sorts"," of"," programs",".\n","mkdir"," ~/","tools","Install"," git",","," if"," you"," don't"," have"," it"," already",".\n","sudo"," apt","-get"," install"," git","Download"," the"," script"," I"," made"," into"," your"," new"," tools"," folder",".\n","sudo"," git"," clone"," https","://","github",".com","/","um","hau","/train","-","voice","-data","-p","ockets","phinx",".git","Install"," S","phinx","Train","."," I"," included"," it"," among"," the"," files"," you"," just"," downloaded","."," Move"," it"," up"," to"," ~/","tools",","," extract"," and"," install"," it","."," It's"," also"," here",","," if"," you"," don't"," want"," to"," use"," the"," one"," I"," provided",".\n","sudo"," mv"," ~/","tools","/train","-","voice","-data","-p","ockets","phinx","/","extra","_files","/s","phinx","train","-","5","pre","alpha",".tar",".gz"," ~/","tools","\n","sudo"," tar"," -","x","v","zf"," ~/","tools","/s","phinx","train","-","5","pre","alpha",".tar",".gz"," -","C"," ~/","tools","\n","make"," -","j"," ","4","\n","make"," -","j"," ","4"," install","\n","Record"," Your"," Voice","Enter"," this"," directory",","," run"," the"," script","."," It'll"," have"," a"," basic"," walkthrough"," built","-in","."," This"," will"," help"," you"," record"," the"," data"," you"," need","."," For"," experimental"," purposes",","," ","20"," recordings"," is"," enough"," for"," about"," ","10","%"," relative"," improvement"," in"," accuracy","."," Use"," the"," name"," neo","-en"," for"," your"," training"," data",","," assuming"," you're"," working"," in"," English",".\n","cd"," ./","train","-","voice","-data","-p","ockets","phinx","You'll"," find"," your"," recordings"," in"," a"," sub","folder"," with"," the"," same"," name"," as"," what"," you"," specified","."," Go"," there",".\n","cd"," ./","neo","-en","By"," the"," way",","," if"," you"," ever"," change"," your"," mind"," about"," what"," you"," want"," your"," model"," to"," be"," named",","," there's"," a"," fantastic"," program"," called"," py","ren","amer"," that"," can"," make"," it"," easy"," to"," rename"," all"," the"," files"," you"," created","."," Install"," it"," with",":\n","sudo"," apt","-get"," install"," py","ren","amer","\n","Process"," Your"," Voice"," Record","ings","Great","!"," Done"," with"," that"," part","."," Now"," we're"," going"," to"," copy"," some"," other"," directories"," into"," the"," current"," working"," directory"," to"," '","work"," on"," them","'.\n","cp"," -","a"," /","usr","/local","/share","/p","ockets","phinx","/model","/en","-us","/en","-us"," .","Based"," on"," this"," source",","," it"," looks"," like"," we"," shouldn't"," be"," working"," with"," .","d","mp"," files","."," This"," is"," a"," point"," of"," deviation"," from"," the"," (","out","dated",")"," CM","U"," walkthrough","."," Copy"," the"," .","bin"," file"," instead","."," Difference"," is"," explained"," below",","," sourced"," from"," the"," tutorial",".\n","cp"," -","a"," /","usr","/local","/share","/p","ockets","phinx","/model","/en","-us","/c","mud","ict","-en","-us",".dict"," .\n","cp"," -","a"," /","usr","/local","/share","/p","ockets","phinx","/model","/en","-us","/en","-us",".l","m",".bin"," .\n","Language"," model"," can"," be"," stored"," and"," loaded"," in"," three"," different"," format"," -"," text"," AR","PA"," format",","," binary"," format"," BIN"," and"," binary"," D","MP"," format","."," AR","PA"," format"," takes"," more"," space"," but"," it"," is"," possible"," to"," edit"," it","."," AR","PA"," files"," have"," .","lm"," extension","."," Binary"," format"," takes"," significantly"," less"," space"," and"," faster"," to"," load","."," Binary"," files"," have"," .","lm",".bin"," extension","."," It"," is"," also"," possible"," to"," convert"," between"," formats","."," D","MP"," format"," is"," obsolete"," and"," not"," recommended",".Now",","," while"," still"," in"," this"," directory",","," generate"," some"," '","ac","oustic"," feature"," files","'.\n","s","phinx","_fe"," -","arg","file"," en","-us","/","feat",".params"," -","sam","pr","ate"," ","160","00"," -","c"," neo","-en",".file","ids"," -","di"," ."," -","do"," ."," -","ei"," wav"," -","eo"," m","fc"," -","ms","wav"," yes","\n","Get"," the"," Full","-S","ized"," Language"," Model","Nice","."," You"," have"," a"," bunch"," more"," files"," with"," weird"," extensions"," on"," them","."," Now"," it's"," time"," to"," convert"," them","."," You"," need"," the"," full"," version"," of"," the"," language"," model",","," which"," was"," not"," shared"," with"," your"," original"," installation"," for"," size"," reasons","."," I"," included"," it"," in"," the"," github"," repository",","," or"," you"," can"," download"," it"," from"," here"," (","you"," want"," the"," file"," named"," cm","us","phinx","-en","-us","-","pt","m","-","5",".","2",".tar",".gz",")."," Put"," the"," extracted"," files"," in"," your"," neo","-en"," directory",".\n","Ass","uming"," you"," use"," the"," one"," from"," the"," github"," repo"," and"," you're"," still"," in"," the"," neo","-en"," sub","directory",",\n","tar"," -","x","v","zf"," ../","extra","_files","/c","mus","phinx","-en","-us","-","pt","m","-","5",".","2",".tar",".gz"," -","C"," .","There's"," an"," folder"," labeled"," en","-us"," within"," the"," neo","-en"," folder"," that"," was"," created"," when"," you"," made"," the"," acoustic"," feature"," files","."," Give"," it"," an"," extension"," and"," save"," it"," in"," case"," of"," horrible"," mistakes",".\n","mv"," ./","en","-us"," ./","en","-us","-original","Now"," move"," the"," newly"," extracted"," directory"," to"," your"," neo","-en"," folder",","," and"," rename"," it"," to"," en","-us",".\n","mv"," ./","cm","us","phinx","-en","-us","-","pt","m","-","5",".","2"," ./","en","-us","This"," converts"," the"," binary"," m","def"," file"," into"," a"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Non-Chat","maxValue":65.75,"maxValueTokenIndex":495,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,48.6875,30.453125,65.75,43.0625,63.09375,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,28,34.625,0,0,0,53.625,23.484375,58.75,0,0,0,0,38.59375,0,0,0,0,0,0,0,0,0,0,0,0,25.21875,0,47.4375,0,31.09375,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,58.5625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,28.6875,55.84375,0,0,0,27.859375,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,52.34375,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,23.453125,39.4375,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,25.734375,24.203125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"k99wo0stx44dm2ou5ct3afhw","tokens":["<|startoftext|>","To"," download"," the"," data"," click"," on"," \"","Get"," the"," Data","\""," within"," the"," article"," and"," then"," download"," the"," data"," in"," .","csv"," format","."," The"," data"," set"," contains"," the"," total"," number"," of"," murders",","," total"," firearm"," murders"," in"," ","201","0"," and"," ","200","9",","," total"," handgun"," murders",","," and"," the"," rates"," of"," firearm"," murder",","," robbery",","," and"," assault"," per"," ","100",",","000"," population"," in"," all"," ","50"," states","."," Note"," that"," there"," are"," missing"," data"," for"," Florida",".\n","After"," the"," data"," are"," downloaded"," open"," them"," in"," a"," spreadsheet"," application","."," Delete"," the"," second"," row"," that"," contains"," the"," totals"," for"," the"," entire"," United"," States","."," We"," only"," want"," data"," for"," states","."," Once"," completed"," save"," the"," file"," as"," US","_G","un",".csv","\n","Next",","," we"," need"," to"," download"," a"," shap","efile"," for"," the"," ","50"," U",".S","."," states","."," Go"," to"," the"," U",".S","."," Census"," Tiger","/","Line"," Files"," webpage"," to"," download"," the"," shap","efile","."," Under"," the"," \"","Select"," Layer"," Type","\""," drop"," down"," menu"," choose"," \"","States"," (","and"," equivalent",")\"",".\n","|","Tiger","/","Line"," Files"," webpage","|\n","On"," the"," next"," webpage",","," under"," the"," \"","State"," and"," Equivalent"," (","201","0",")\""," drop"," down"," menu"," choose"," \"","All"," states"," in"," one"," national"," file","\""," and"," then"," click"," download",".\n","After"," the"," data"," are"," downloaded"," open"," the"," shap","efile"," in"," Cart","ograph","ica",".\n","Next",","," to"," import"," and"," join"," the"," .","csv"," file"," containing"," the"," gun"," data"," to"," the"," U",".S","."," states"," shap","efile"," use"," the"," following"," steps",".\n","1","."," Click"," File"," >"," Import"," Table"," data"," >"," Choose"," the"," US","_G","un",".csv"," file","\n","2","."," Next",","," we"," need"," to"," match"," the"," .","csv"," file"," to"," the"," states"," shap","efile","."," Click"," on"," the"," Join"," tab"," in"," the"," top"," right"," of"," the"," import"," file"," window",".\n","3","."," Change"," \"","Target"," Layer","\""," in"," the"," bottom"," right"," to"," tl","_","201","0","_us","_state","10"," (","this"," should"," be"," the"," title"," of"," the"," state"," shap","efile",").\n","4","."," Under"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Non-Chat","maxValue":62.3125,"maxValueTokenIndex":324,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,24.078125,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,62.3125,32.65625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"w449eav4doe9fwhsu6h0w2rk","tokens":["<|startoftext|>","Because"," I","’m"," easily"," distracted",","," I"," thought"," I","’d"," take"," on"," the"," challenge","."," Surely"," it"," would"," be"," possible"," to"," set"," up"," the"," sharing"," buttons"," logically",","," so"," that"," they"," could"," be"," easily"," implemented"," on"," any"," post","."," I"," started"," with"," Paul"," Under","wood","’s"," excellent"," and"," really"," helpful"," post"," about"," how"," to"," create"," sharing"," links"," for"," each"," of"," the"," major"," social"," networks","."," Within"," a"," couple"," of"," days",","," I"," had"," a"," functional"," plugin"," in"," hand",","," which"," quietly"," added"," social"," sharing"," buttons"," to"," the"," end"," of"," posts",".\n","At"," that"," point",","," I"," added"," the"," plugin"," to"," my"," own"," site",","," shared"," it"," with"," a"," few"," friends",","," and"," then"," pretty"," much"," ignored"," it","."," It"," was"," possible"," to"," customize"," the"," plugin","–","possible"," for"," developers",","," anyway","–","with"," jud","icious"," use"," of"," filters",","," one"," could"," do"," simple"," things",","," like"," add"," the"," author","’s"," twitter"," handle",","," or"," more"," complex"," things",","," like"," add"," new"," social"," networks"," to"," the"," buttons","."," By"," default",","," the"," buttons"," were"," added"," only"," to"," posts",","," but"," it"," was"," possible"," (","with"," another"," filter","),"," to"," add"," them"," to"," other"," post"," types"," as"," well","."," It"," did"," what"," I"," needed",","," so"," I"," polished"," it"," a"," bit"," and"," then"," ignored"," it","."," Although"," I"," considered"," submitting"," it"," to"," the"," Word","Press"," plugin"," repository",","," I"," chose"," not"," to","–","although"," my"," little"," plugin"," was"," very"," developer"," friendly",","," it"," wasn","’t"," user"," friendly",","," and"," I"," was"," concerned"," that"," the"," lack"," of"," settings"," (","for"," something"," as"," small"," as"," the"," twitter"," handle",","," for"," example",")"," would"," be"," a"," stumbling"," block"," for"," the"," average"," user","."," And"," I"," felt"," that"," interest"," in"," this"," kind"," of"," plugin"," would"," be"," fairly"," limited",","," because"," the"," buttons"," are"," so"," incredibly"," simple",".\n","Towards"," the"," end"," of"," February",","," one"," of"," my"," users"," (","possibly"," the"," only"," one"," at"," that"," point"," other"," than"," myself",")"," contacted"," me"," and"," asked"," me"," to"," consider"," submitting"," the"," plugin"," to"," the"," official"," repository",","," in"," order"," to"," take"," advantage"," of"," its"," powerful"," update"," system","/process","."," While"," I"," agreed"," that"," I"," enjoyed"," using"," the"," plugin",","," and"," it"," worked"," quite"," nicely",","," I"," really"," didn","’t"," consider"," that"," very"," many"," people"," would"," be"," interested"," in"," using"," it",","," certainly"," not"," without"," some"," kind"," of"," easier"," to"," access"," settings",".\n","You"," May"," Also"," Like",":\n","Over"," the"," course"," of"," another"," weekend",","," I"," put"," my"," head"," down"," and"," built"," a"," settings"," page",","," which"," included"," not"," only"," an"," easy"," way"," to"," add"," a"," twitter"," handle",","," but"," also"," allowed"," users"," to"," select"," post"," types"," on"," which"," to"," add"," sharing"," buttons",","," as"," well"," as"," which"," buttons"," to"," show","."," Users"," who"," want"," to"," implement"," their"," own"," styling"," can"," easily"," remove"," the"," plugin"," styling"," from"," the"," settings"," page"," as"," well",","," so"," it","’s"," still"," pretty"," developer","/des","igner"," friendly","."," Another"," few"," days",","," and"," the"," plugin"," was"," approved"," for"," the"," Word","Press"," plugin"," repository",".\n","I"," still"," thought"," that"," I"," was"," writing"," this"," plugin"," primarily"," for"," myself",","," so"," I"," was"," mildly"," aston","ished"," (","and"," grat","ified",")"," to"," see"," an"," immediate",","," and"," generally"," positive",","," response","."," Because"," of"," not"," using"," any"," scripts",","," there"," are"," some"," limitations"," to"," the"," plugin",":"," no"," sharing"," counts",","," for"," example",","," and"," posts"," with"," no"," featured","/","associated","/","attached"," images"," will"," not"," output"," a"," Pinterest"," button"," (","because"," the"," first"," rule"," of"," Pinterest"," is"," that"," we"," don","’t"," share"," things"," without"," an"," image",")."," But"," within"," its"," limitations",","," it"," works"," simply"," and"," efficiently","."," One"," note",":"," although"," I"," write"," some"," plugins"," which"," work"," only"," on"," sites"," using"," the"," Genesis"," Framework",","," this"," isn","’t"," one"," of"," them","."," It"," should"," work"," with"," any"," theme"," (","it"," works"," with"," the"," default"," Twenty"," themes",").\n","So",","," if"," you","’re"," interested"," in"," using"," a"," social"," sharing"," plugin"," with"," very"," little"," overhead","–","no"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Non-Chat","maxValue":62.3125,"maxValueTokenIndex":639,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,62.3125,23.46875,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"u6tfopiyvz0wrt23thsg0yur","tokens":["<|startoftext|>","Last"," Updated",":"," ","201","8","-","07","-","18"," ","02",":","38",":","21"," UTC","\n","by"," Scott"," F","end","ley"," (","Version",":"," ","1",")\n","Oracle"," released"," their"," quarterly"," critical"," patch"," update"," today","."," This"," patch"," addresses"," a"," record"," number"," of"," ","334"," vulnerabilities"," across"," a"," wide"," set"," of"," Oracle"," supported"," products",".\n","V","ulner","abilities"," in"," Web","logic",","," Oracle"," Spatial",","," and"," Oracle"," Fusion"," Middleware"," Map","Viewer"," are"," rated"," with"," CV","SS"," scores"," of"," ","9",".","8","."," Des","erialization"," based"," attacks"," within"," Web","logic"," server"," has"," been"," used"," as"," attack"," vectors"," in"," the"," past"," year",","," and"," used"," to"," install"," crypto"," miner"," campaigns","."," It"," is"," likely"," that"," these"," types"," of"," campaigns"," will"," continue"," for"," the"," for","see","able"," future",".\n","We"," recommend"," the"," review"," of"," the"," full"," CPU"," release"," to"," identify"," impacted"," software"," packages"," within"," your"," organization",","," and"," make"," plans"," to"," address"," those"," that"," create"," the"," largest"," risk","."," The"," full"," bulletin"," is"," available"," at"," Oracle"," at"," the"," URL"," http","://","www",".oracle",".com","/","techn","etwork","/security","-ad","vis","ory","/c","pu","jul","201","8","-","425","824","7",".html"," .\n","Scott"," F","end","ley"," ISC"," Handler","\n","Last"," Updated",":"," ","201","8","-","07","-","17"," ","11",":","48",":","00"," UTC","\n","by"," Xavier"," M","ert","ens"," (","Version",":"," ","1",")\n","For"," the"," human"," brain",","," an"," IP"," address"," is"," not"," the"," best"," IOC"," because",","," like"," phone"," numbers",","," we"," are"," bad"," to"," remember"," them","."," That","’s"," why"," DNS"," was"," created","."," But",","," in"," many"," log"," management"," applications",","," there"," are"," features"," to"," enrich"," collected"," data","."," One"," of"," the"," possible"," enrichment"," for"," IP"," addresses"," is"," the"," ge","ol","ocal","ization","."," Based"," on"," databases",","," it"," is"," possible"," to"," locate"," an"," IP"," address"," based"," on"," the"," country"," and","/or"," the"," city","."," This"," information"," is"," available"," in"," our"," D","Shield"," IP"," reputation"," database","."," But"," you"," can"," also"," find"," coordinates"," with"," a"," latitude"," and"," a"," longitude",":\n","$$"," geo","ip","lookup"," isc",".s","ans",".edu"," Geo","IP"," Country"," Edition",":"," US",","," United"," States"," Geo","IP"," City"," Edition",","," Rev"," ","1",":"," US",","," MD",","," Maryland",","," Bethesda",","," ","208","14",","," ","39",".","006","001",","," -","77",".","102","501",","," ","511",","," ","301"," Geo","IP"," AS","Num"," Edition",":"," AS","626","69"," S","ANS"," IN","STITUTE","\n","The"," command"," geo","ip","lookup",","," as"," well"," as"," the"," Geo","IP"," databases",","," are"," developed"," by"," Max","mind"," "," which"," is"," one"," of"," the"," companies"," which"," provide"," this"," kind"," of"," services","."," Of"," course",","," you"," can"," also"," create"," your"," own","/private"," database"," of"," IP"," address"," (","or"," sub","nets",")"," and"," attach"," coordinates"," to"," them","."," This"," is"," very"," useful"," if"," you"," operate"," a"," worldwide"," network"," or"," if"," you","’re"," based"," in"," a"," large"," country"," like"," the"," United"," States","."," In"," this"," case",","," if"," sub","nets"," are"," assigned"," per"," branch"," offices",","," you"," can"," search"," for"," their"," coordinates"," via"," Google"," maps"," and"," populate"," your"," database",":\n","Once"," this"," exercise"," completed",","," the"," idea"," is"," to"," compute"," the"," distance"," between"," two"," IP"," addresses"," using"," the","”","H","avers","ine","”"," formula"," which"," determines"," the"," distance"," between"," two"," points"," on"," a"," sphere"," given"," their"," long","itudes"," and"," lat","itudes","."," Here"," is"," a"," quick"," and"," dirty"," Python"," script"," which"," implements"," the"," formula"," for"," two"," IP"," addresses"," Geo","IP"," look","ups",":\n","#!/","usr","/bin","/python"," import"," sys"," import"," geo","ip","2",".database"," import"," math"," def"," hav","ers","ine","((","lat","1",","," long","1","),"," (","lat","2",","," long","2",")):"," radius"," ="," ","637","1"," #"," In"," kilometers"," d","Lat"," ="," math",".r","adians","(lat","2"," -"," lat","1",")"," d","Long"," ="," math",".r","adians","(long","2"," -"," long","1",")"," a"," ="," (","math",".sin","(d","Lat"," /"," ","2",")"," **"," ","2"," +"," math",".cos","(math",".r","adians","(lat","1","))"," *"," math",".cos","(math",".r","adians","(lat","2","))"," *"," math",".sin","(d","Long"," /"," ","2",")"," **"," ","2",")"," c"," ="," ","2"," *"," math",".atan","2","(math",".sqrt","(a","),"," math",".sqrt","(","1"," -"," a","))"," d"," ="," radius"," *"," c"," return"," d"," reader","=","geo","ip","2",".database",".Reader","('","Geo","Lite","2","-C","ity",".mm","db","')"," r","1"," ="," reader",".city","(sys",".argv",")"," r","2"," ="," reader",".city","(sys"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Non-Chat","maxValue":60.59375,"maxValueTokenIndex":723,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,60.59375,42.65625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"kuibcxyg4d84dt63ndl0ekft","tokens":["<|startoftext|>","Just"," upgraded"," to"," ","3",".","1",","," and"," I"," noticed"," the"," \"","Editor","\""," button"," under"," \"","Appearance","\""," is"," now"," gone","."," ..."," Tried"," it"," with"," the"," Twenty","-ten"," theme"," to"," make"," sure"," it"," wasn't"," a"," theme"," issue","."," No"," matter"," which"," theme"," I"," choose",","," it"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Non-Chat","maxValue":55.90625,"maxValueTokenIndex":30,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,55.90625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"r0xoqtys97k1gespn424w0qu","tokens":["<|startoftext|>","We"," do"," our"," best"," to"," monitor"," the"," tickets"," around"," the"," clock",","," however",","," this"," is"," not"," always"," possible"," due"," to"," different"," time","zones",","," We"," checking"," support"," system"," several"," times"," in"," the"," day","."," Reply"," times"," can"," vary"," from"," time"," to"," time"," and"," be"," up"," to"," ","24"," hours"," Monday"," –"," Friday"," and"," up"," to"," ","48"," hours"," on"," weekends",","," Sat"," -"," Sun","."," but"," is"," usually"," faster"," than"," that",".\n","Welcome"," to"," J","WS","Theme","'s"," Support"," Center","\n","Please"," make"," sure"," you"," include"," the"," following"," information"," for"," quick"," and"," smooth"," support",":\n","-"," Purchase"," Code",".\n","If"," you"," do"," not"," include"," a"," purchase"," code",","," we"," may"," request"," this"," information"," as"," our"," first"," response",".\n","-"," Link"," to"," your"," site",".\n","If"," something"," isn't"," working",","," please"," send"," us"," a"," link"," to"," the"," page"," where"," it"," isn't"," working",".\n","-"," Include"," FTP",","," Word","Press"," login"," info",","," links"," related"," and"," screenshots"," are"," always"," welcome","!"," Provide"," us"," with"," all"," the"," information"," you"," can"," give"," us","!"," The"," fastest"," way"," for"," us"," to"," help"," is"," for"," us"," to"," view"," your"," backend"," setup",".\n","-"," What"," theme"," version"," installed","\n","If"," the"," theme"," has"," issues",","," please"," tell"," us"," the"," theme"," version"," you're"," having"," trouble"," with",".\n","-"," Prepare"," your"," installation","\n","Switch"," to"," the"," Twenty","F","if","teen"," theme"," before"," you"," create"," the"," ticket","."," Please"," test"," this"," before"," opening"," your"," ticket"," so"," we"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Non-Chat","maxValue":49.65625,"maxValueTokenIndex":219,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,49.65625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"hmi3ct8vjdgrafzadblqimwl","tokens":["<|startoftext|>","Phy","logen","omic"," analysis"," of"," UDP"," gly","cos","yl","transfer","ase"," ","1"," mult","ig","ene"," family"," in"," Lin","um"," us","itat","iss","imum"," identified"," genes"," with"," varied"," expression"," patterns","\n","©"," Bar","v","kar"," et"," al",";"," license","e"," Bio","Med"," Central"," Ltd","."," ","201","2","\n","Received",":"," ","30"," September"," ","201","1","\n","Accepted",":"," ","8"," May"," ","201","2","\n","Published",":"," ","8"," May"," ","201","2","\n","The"," gly","cos","yl","ation"," process",","," catal","y","zed"," by"," ubiquitous"," gly","cos","yl","transfer","ase"," (","GT",")"," family"," enzymes",","," is"," a"," prevalent"," modification"," of"," plant"," secondary"," metabolites"," that"," regulates"," various"," functions"," such"," as"," hormone"," home","ostasis",","," detox","ification"," of"," xen","obi","otics"," and"," bios","ynthesis"," and"," storage"," of"," secondary"," metabolites","."," Fl","ax"," (","L","inum"," us","itat","iss","imum"," L",".)"," is"," a"," commercially"," grown"," oil","seed"," crop",","," important"," because"," of"," its"," essential"," fatty"," acids"," and"," health"," promoting"," lign","ans","."," Identification"," and"," characterization"," of"," UDP"," gly","cos","yl","transfer","ase"," (","UG","T",")"," genes"," from"," flax"," could"," provide"," valuable"," basic"," information"," about"," this"," important"," gene"," family"," and"," help"," to"," explain"," the"," seed"," specific"," gly","cos","yl","ated"," metabol","ite"," accumulation"," and"," other"," processes"," in"," plants","."," Plant"," genome"," sequencing"," projects"," are"," useful"," to"," discover"," complexity"," within"," this"," gene"," family"," and"," also"," pave"," way"," for"," the"," development"," of"," functional"," genom","ics"," approaches",".\n","Taking"," advantage"," of"," the"," newly"," assembled"," draft"," genome"," sequence"," of"," flax",","," we"," identified"," ","137"," UDP"," gly","cos","yl","transfer","ase"," (","UG","T",")"," genes"," from"," flax"," using"," a"," conserved"," signature"," motif","."," Ph","y","logen","etic"," analysis"," of"," these"," protein"," sequences"," clustered"," them"," into"," ","14"," major"," groups"," (","A","-N",")."," Expression"," patterns"," of"," these"," genes"," were"," investigated"," using"," publicly"," available"," expressed"," sequence"," tag"," (","EST","),"," micro","array"," data"," and"," reverse"," transcription"," quantitative"," real"," time"," PCR"," (","RT","-q","PCR",")."," Se","venty","-three"," per"," cent"," of"," these"," genes"," (","100"," out"," of"," ","137",")"," showed"," expression"," evidence"," in"," ","15"," tissues"," examined"," and"," indicated"," varied"," expression"," profiles","."," The"," RT","-q","PCR"," results"," of"," ","10"," selected"," genes"," were"," also"," coherent"," with"," the"," digital"," expression"," analysis","."," Interestingly",","," five"," duplicated"," U","GT"," genes"," were"," identified",","," which"," showed"," differential"," expression"," in"," various"," tissues","."," Of"," the"," seven"," intr","on"," loss","/g","ain"," positions"," detected",","," two"," intr","on"," positions"," were"," conserved"," among"," most"," of"," the"," U","GT","s",","," although"," a"," clear"," relationship"," about"," the"," evolution"," of"," these"," genes"," could"," not"," be"," established","."," Comparison"," of"," the"," flax"," U","GT","s"," with"," orth","olog","s"," from"," four"," other"," sequ","enced"," dic","ot"," genomes"," indicated"," that"," seven"," U","GT","s"," were"," flax"," diver","ged",".\n","Fl","ax"," has"," a"," large"," number"," of"," U","GT"," genes"," including"," few"," flax"," diver","ged"," ones","."," Ph","y","logen","etic"," analysis"," and"," expression"," profiles"," of"," these"," genes"," identified"," tissue"," and"," condition"," specific"," repertoire"," of"," U","GT"," genes"," from"," this"," crop","."," This"," study"," would"," facilitate"," precise"," selection"," of"," candidate"," genes"," and"," their"," further"," characterization"," of"," substrate"," specific","ities"," and"," in"," planta"," functions",".\n","Fl","ax"," or"," lin","seed"," (","L","inum"," us","itat","iss","imum"," L",".)"," is"," one"," of"," the"," earliest"," domest","icated"," crops","."," It"," is"," a"," self","-p","oll","inating"," dip","loid"," species"," cultivated"," as"," a"," source"," of"," fibre",","," oil"," and"," medicinal"," compounds","."," Historically"," it"," has"," been"," used"," as"," a"," model"," for"," developmental"," studies"," and"," has"," a"," different"," evolutionary"," history"," than"," other"," model"," plants"," like"," Arab","id","opsis"," ."," Among"," plant"," foods",","," flax","seed"," has"," the"," highest"," contents"," of"," the"," essential"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Non-Chat","maxValue":49.59375,"maxValueTokenIndex":588,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,49.59375,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"r6ihrzzlqyf2hmcc50i6gc3g","tokens":["<|startoftext|>","Last"," Activity",":","11","-","18","-","201","1"," ","10",":","39"," PM","\n","Posted"," in"," thread",":"," First"," Brew"," -"," A","HS"," American"," Amber"," Ale"," on"," ","09","-","22","-","200","9"," at"," ","12",":","36"," AM","\n","Did"," you"," use"," a"," liquid"," yeast"," or"," dry"," one","?","you"," asking"," me","?","I"," used"," the"," White"," Labs"," yeast"," (","W","LP","051",")"," that","\n","came"," with"," the"," A","HS"," kit",":\n","Posted"," in"," thread",":"," First"," Brew"," -"," A"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Non-Chat","maxValue":48.5625,"maxValueTokenIndex":65,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,48.5625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"qddsp3blemouxgl78uh91o6p","tokens":["<|startoftext|>","Recursive"," Deep"," Models"," for"," Semantic"," Com","pos","itional","ity"," Over"," a"," Sent","iment"," Tree","bank",","," Richard"," So","cher",","," Alex"," Per","ely","gin",","," Jean"," Wu",","," Jason"," Ch","uang",","," Chris"," Manning",","," Andrew"," Ng"," and"," Chris"," Pot","ts","."," Conference"," on"," Emp","irical"," Methods"," in"," Natural"," Language"," Processing"," (","EM","N","LP"," ","201","3",","," Oral",")."," pdf",";","Website"," with"," Live"," Demo"," and"," Downloads","\n"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Non-Chat","maxValue":46.25,"maxValueTokenIndex":34,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,46.25,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,23.65625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"us31n8hmgfu7it5l4fkzr61m","tokens":["<|startoftext|>","Which"," genome"," assemblies"," does"," GREAT"," support","?\n","Currently",","," GREAT"," supports"," recent"," assemblies"," of"," the"," well","-","annot","ated"," human"," (","U","CSC"," hg","19"," and"," UCS","C"," hg","18",")"," and"," mouse"," (","U","CSC"," mm","9",")"," genomes","."," GREAT"," can"," be"," expanded"," to"," include"," additional"," well","-","annot","ated"," genomes"," (","such"," as"," Zeb","raf","ish","),"," and"," can"," also"," be"," expanded"," into"," poorly","-character","ized"," genomes"," by"," carefully"," projecting"," annotations"," from"," well","-","annot","ated"," genomes","."," We"," hope"," to"," gradually"," expand"," the"," set"," of"," species"," we"," support",".\n","Can"," I"," use"," a"," different"," species"," or"," assembly","?\n","If"," you"," have"," genomic"," regions"," defined"," for"," a"," different"," species"," or"," assembly"," from"," the"," ones"," we"," currently"," support",","," you"," can"," use"," the"," UCS","C"," Lift","Over"," utility"," to"," convert"," to"," a"," supported"," assembly","."," The"," Lift","Over"," typically"," works"," very"," well"," for"," within"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Non-Chat","maxValue":45.6875,"maxValueTokenIndex":37,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,29.953125,28.78125,0,0,0,0,25.65625,0,0,0,0,0,0,0,45.6875,30.984375,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,33.71875,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"dfbcp1xh00qmfvqy0hu3q8gw","tokens":["<|startoftext|>","News"," Blog",":"," Word","Press"," &"," Joomla"," Extensions","\n","Wel","coming"," Word","Press"," ","5",".","0"," and"," the"," New"," Digital"," Print","\n","It"," has"," been"," months"," in"," the"," making","."," Issues"," opened",","," and"," issues"," resolved","."," Hundreds"," of"," collaborators",","," working"," on"," a"," single"," project"," to"," bring"," out"," the"," best"," of"," it","."," Most"," importantly",","," a"," production","-ready"," system"," came"," out"," of"," it","."," Word","Press"," ","5",".","0"," is"," finally"," released",".\n","During"," the"," past"," few"," months",","," we"," have"," been"," patiently"," observing"," Word","Press"," developing"," to"," become"," the"," fully","-fledged"," Content"," Management"," System"," that"," it"," is"," today","."," Pat","ience"," was"," rewarded"," on"," December"," ","6",","," when"," the"," fifth"," major"," version"," was"," released"," into"," the"," wild",".\n","This"," time",","," it"," is"," not"," just"," any"," release","."," Word","Press"," ","5",".","0"," packs"," some"," of"," the"," most"," drastic"," changes"," in"," its"," history","."," Most"," notably",","," the"," switch"," to"," the"," Gutenberg"," editor"," alters"," the"," way"," we"," think"," about"," content"," creation",","," though"," the"," shift"," is"," not"," being"," enforced"," just"," yet",".\n","G","uten","berg"," is"," an"," editor",","," but"," also"," much"," more"," than"," that","."," The"," idea"," behind"," Gutenberg"," isn","’t"," to"," change"," the"," way"," bloggers"," create"," content"," for"," the"," sake"," of"," change"," -"," the"," Classic"," editor"," was"," doing"," the"," job"," fine",","," after"," all","."," Instead",","," Gutenberg"," transforms"," the"," way"," that"," Word","Press"," sees"," and"," interpre","ts"," content",".\n","If"," you"," are"," new"," to"," the"," entire"," idea"," of"," Gutenberg",","," it"," suff","ices"," to"," say"," that"," the"," editor"," does"," not"," create"," Word","Press"," posts"," and"," pages"," in"," one"," mon","olithic"," chunk","."," On"," the"," contrary",","," content"," is"," made"," up"," of"," a"," sequence"," of"," blocks",".\n","In"," this"," way",","," paragraphs",","," media"," and"," anything"," else"," that"," you"," might"," think"," of"," are"," next"," to"," each"," other"," as"," autonomous"," units","."," The"," blocks"," can"," be"," edited",","," moved"," around"," and"," switched"," out"," without"," affecting"," neighbouring"," elements","."," On"," top"," of"," that",","," some"," can"," even"," contain"," other",","," smaller"," blocks","."," In"," short",","," Gutenberg"," is"," as"," simple"," or"," versatile"," as"," you","’d"," want"," it"," to"," be",".\n","This"," flexibility"," permits"," Gutenberg"," to"," become"," a"," spring","board"," for"," more"," development","."," Other"," plugins"," have"," already"," started"," to"," surface",","," including"," J","oom","United","’s"," own"," Advanced"," Gutenberg","."," Their"," goal","?"," Expl","o","iting"," a"," solid"," infrastructure"," to"," expand"," your"," tool","set"," with"," even"," more"," blocks",".\n","G","uten","berg","’s"," structure"," is"," permiss","ive"," of"," more"," functionality"," that"," would"," not"," have"," been"," possible"," with"," the"," Classic"," editor","."," Blocks"," can"," be"," saved"," to"," be"," reused"," at"," a"," later"," stage",","," like"," templates","."," This"," makes"," it"," more"," difficult"," to"," irrev","oc","ably"," make"," erroneous"," design"," changes"," to"," your"," Word","Press"," blog",".\n","Moreover",","," this"," principle"," is"," ever","-present"," throughout"," Word","Press"," ","5",".","0","."," From"," individual"," block"," structures"," to"," themes"," themselves",","," Word","Press"," protects"," creations"," from"," inadvert","ent"," edits","."," However",","," if"," you"," don","’t"," want"," to"," up","end"," your"," workflow"," just"," yet",","," you"," don","’t"," have"," to",".\n","The"," Good"," Old"," Editor","\n","G","uten","berg"," has"," come"," a"," long"," way"," since"," its"," bug","-r","idd","led"," days","."," In"," spite"," of"," its"," advantages",","," it"," may"," not"," be"," enough"," reason"," to"," switch"," over"," from"," the"," traditional"," editing"," experience","."," The"," Classic"," Editor"," plugin"," is"," Word","Press","’"," solution"," to"," continue"," wall","owing"," in"," the"," nostalgia"," of"," byg","one"," days","."," In"," many"," ways",","," the"," editor"," is"," identical"," to"," the"," one"," you"," were"," used"," to",","," except"," for"," the"," fact"," that"," it"," needs"," to"," be"," installed"," anew"," now",".\n","Nonetheless",","," as"," alluring"," as"," it"," may"," sound",","," you"," might"," not"," want"," to"," over","stay"," the"," plugin","’s"," welcome","."," Word","Press"," has"," already"," said"," that"," official"," support"," will"," continue"," up"," until"," ","202","1",","," after"," which"," no"," fixes"," will"," be"," forthcoming",".\n","Although"," ","202","1"," sounds"," far","-off",","," it"," is"," highly"," likely"," that"," just"," about"," anything"," related"," to"," Word","Press"," will"," migrate"," to"," Gutenberg","."," And"," that"," transition"," has"," already"," started","."," Word","Press"," ","5",".","0"," includes"," a"," new"," default"," theme"," -"," Twenty"," N","inete","en","."," No"," surprises"," in"," the"," name",","," but"," the"," design"," has"," been"," built"," using"," Gutenberg"," itself"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Non-Chat","maxValue":45.59375,"maxValueTokenIndex":697,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,45.59375,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"hrw3tl54cb62mxvbdmocbsr1","tokens":["<|startoftext|>","By"," building"," your"," own"," humidity"," control"," system"," with"," just"," an"," Io","T"," enabled"," Arduino"," board"," and"," a"," basic"," humid","ifier"," you"," can"," monitor"," and"," control"," the"," humidity"," levels"," in"," your"," home"," to"," stay"," at"," comfortable"," and"," healthy"," levels",".\n","This"," is"," What"," You"," Need","\n","-"," Arduino"," Nano"," ","33"," Io","T"," /"," Arduino"," Nano"," RP","204","0"," Connect","\n","-"," Air"," humid","ifier","\n","-"," Temperature"," &"," humidity"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Non-Chat","maxValue":44.6875,"maxValueTokenIndex":50,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,44.6875,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"gqc1r0etk50g7jlryhq4ptki","tokens":["<|startoftext|>","Browse"," and"," Enjoy"," Reading","!\n","Guys",","," another"," major"," release"," of"," B","WP"," G","XS"," is"," now"," available","!"," The"," biggest"," change"," made"," since"," ","1",".","1",".","6"," is"," the"," ability"," to"," build"," a"," Google"," News"," sitemap"," that"," can"," be"," submitted"," to"," Google"," News"," without"," hassle"," :","D",".\n","All"," you"," have"," to"," do"," is"," click"," on"," the"," newly"," added"," tab"," (","News"," sitemap","),"," enable"," the"," module",","," choose"," some"," news"," categories"," as"," well"," as"," their"," genres"," and"," you're"," ready"," to"," go","."," Your"," news"," sitemap"," can"," also"," be"," used","..."," more","\n","After"," reading"," Small"," Giants",":"," Companies"," That"," Choose"," to"," Be"," Great"," Instead"," of"," Big"," written"," by"," Bo"," Burl","ingham"," I"," have"," come"," up"," with"," the"," idea"," of"," writing"," about"," small"," plugins"," that"," can"," greatly"," improve"," functionality"," for"," your"," blog","."," If"," you"," think"," a"," great"," plugin"," needs"," to"," be"," huge",","," you"," are"," definitely"," wrong"," and"," you"," should"," go"," see"," the"," book"," I"," have"," mentioned"," right"," away",".\n","Small"," Giants"," will"," be"," a"," series"," of"," posts"," on"," Better","WP",".net","..."," more","\n","As"," a"," Word","Press"," end","-users",","," you"," might"," never"," care"," about"," the"," term"," \"","Memory"," Usage","\""," until"," you"," encounter"," a"," fatal"," error"," that"," keeps"," your"," site"," from"," working"," normally",".\n","Memory"," Usage"," (","in"," Word","Press","'s"," case",")"," is"," used"," to"," refer"," to"," how"," much"," CPU"," memory"," your"," PHP"," scripts"," (","plugins",","," themes",","," and"," Word","Press"," core"," files",")"," consume"," when"," they"," get"," parsed","."," Word","Press","'s"," core"," files"," (","Twenty"," Ten"," theme"," installed",")"," consumes"," about"," ","13","MB"," of"," memory"," (","on"," some"," hosts"," with"," added"," modules"," or"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Non-Chat","maxValue":44.65625,"maxValueTokenIndex":256,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,44.65625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null},{"id":"vjpnnzboftjopivdtt85gos2","tokens":["<|startoftext|>","Mal","heureusement",","," cette"," page"," n","'est"," actuellement"," pas"," encore"," disponible"," en"," français","."," Nous"," ne"," pouvons"," vous"," transmettre"," cette"," information"," qu","'en"," anglais"," pour"," le"," moment","."," Merci"," de"," votre"," compréhension",".\n","C","ines","c","apes"," -"," atmospheric"," sound","sc","apes","\n","C","ines","c","apes"," offers"," you"," a"," versatile"," toolbox"," for"," creating"," sound"," environments"," for"," diverse"," moods",","," as"," well"," as"," ready"," to"," go"," sound","sc","apes"," and"," rh","yt","mic"," ambience"," elements","."," The"," sound"," pal","lette"," for"," C","ines","c","apes"," is"," mostly"," sourced"," from"," their"," organic",","," analog"," and"," ambience","/","field"," recordings",".\n","In"," this"," ","1",".","6"," Gb"," library",","," you"," will"," find"," ","90","+"," stems"," from"," ","25","+"," sc","apes",","," organised"," into"," Kontakt"," presets"," Dark",","," T","ense",","," Dream","y",","," Mel","anch","oly",","," Hope",","," Mystic",","," World","."," Mult","is","ample"," solo"," instruments"," and"," a"," “","noise"," and"," amb","iences","”"," preset"," is"," also"," included"," letting"," you"," access"," all"," noise","&","amb","ience"," stems","."," Also",","," the"," stem"," files"," are"," labeled"," as"," Ton","al",","," (","N",")","oise",","," (","B",")","ass",","," Lead"," etc","."," and"," their"," tone"," letters"," for"," those"," who"," prefer"," working"," with"," W","av"," files",".\n","Whether"," starting"," from"," scratch",","," breaking"," down"," or"," dropping"," a"," tonal","/no","ise"," backing"," on"," an"," already"," rolling"," track",";"," contributing"," to"," a"," story"," told"," by"," film"," or"," just"," sp","icing"," up"," some"," ambient"," or"," cross"," genre"," sound"," world"," of"," yours",","," Rast"," Sound"," believes"," there"," is"," something"," for"," you"," here",".\n","Please"," notice",":"," This"," library"," can"," not"," be"," used"," with"," the"," free"," Kontakt"," Player","!"," To"," use"," this"," \"","Open"," Kontakt","\""," format",","," you"," need"," a"," full"," version"," of"," Kontakt",","," which"," is"," included"," in"," products"," such"," as"," Kom","plete"," or"," Kom","plete"," Ultimate",".\n","The"," minimum"," required"," Kontakt"," version"," number"," for"," this"," product"," is"," stated"," in"," the"," product"],"dataIndex":null,"index":"74658","layer":"11-resid-post-aa","modelId":"gpt-oss-20b","dataSource":"Non-Chat","maxValue":43.0625,"maxValueTokenIndex":302,"minValue":0,"values":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,43.0625,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"dfaValues":[],"dfaTargetIndex":-1,"dfaMaxValue":0,"creatorId":"clkht01d40000jv08hvalcvly","createdAt":"$D2025-09-24T05:17:36.215Z","lossValues":[],"logitContributions":null,"binMin":-1,"binMax":-1,"binContains":-1,"qualifyingTokenIndex":null}],"explanations":[{"id":"hav7ju6mgxfgvh3pecllhk8xy","description":"_core","explanationModelName":"gemini-2.0-flash","typeName":"np_max-act","scores":[],"triggeredByUser":null}]},"embed":false,"embedPlots":true,"embedTest":true,"defaultTestText":"$undefined","embedTestField":true,"embedExplanation":true,"embedActivations":true,"embedLink":true,"embedSteer":true,"data-sentry-element":"FeatureDashboard","data-sentry-source-file":"page.tsx"}]}]

_core

No Comments

No Known Activations