Untitled

mail@pastecode.io avatarunknown
plain_text
a month ago
1.5 kB
1
Indexable
Never
def input_evalution(input_processed_text, df_train_mtrx, tfidf_vector, df_act,
                    *, min_score=0.25, placeholder_id='test123'):
    """Find the known tickets most similar to a processed input text.

    The text is vectorised with ``tfidf_vector``, compared against every row
    of ``df_train_mtrx`` using cosine similarity, and the rows of ``df_act``
    whose ``ticket_id`` scored above ``min_score`` are returned together
    with that score.

    Args:
        input_processed_text: Text to evaluate. It is handed to
            ``tfidf_vector.transform`` as a one-element list.
        df_train_mtrx: DataFrame with one row per ticket; its index supplies
            the ticket ids. NaN cells are treated as 0. The caller's frame
            is not modified.
        tfidf_vector: Object exposing ``transform`` that returns a sparse
            matrix. Presumably the fitted vectoriser that produced
            ``df_train_mtrx`` (the column counts must match) -- confirm
            against the caller.
        df_act: DataFrame with a ``ticket_id`` column. The caller's frame
            is not modified.
        min_score: Similarity a ticket must exceed to be reported.
        placeholder_id: Ticket id that is never reported as a match.

    Returns:
        A ``(df_eval, df_tst)`` tuple. ``df_eval`` is a copy of the matching
        ``df_act`` rows (original index and order preserved) with an added
        ``score`` column. ``df_tst`` is the one-row dense TF-IDF vector of
        the input text as a DataFrame.
    """
    print("Into Input Evaluation function")
    print("Text : ", input_processed_text)
    print("TFIDF Vector : ", tfidf_vector)

    input_tfidf = tfidf_vector.transform([input_processed_text])
    print("Input TF IDF : ", input_tfidf)
    # toarray() yields a plain ndarray; todense() would give the discouraged
    # np.matrix type.
    x = input_tfidf.toarray()
    print("X : ", x)
    df_tst = pd.DataFrame(x)

    # Treat missing weights as 0 without writing into the caller's matrix.
    train_matrix = df_train_mtrx.fillna(0)

    # One similarity per training row: shape (n_rows, 1).
    scr = cosine_similarity(train_matrix, df_tst)
    print("Cosine Similarity : ", scr)

    df_chk = pd.DataFrame({
        'ticket_id': train_matrix.index,
        'score': scr.ravel(),
    })
    print("DF CHeck : ", df_chk.head())

    is_match = (
        (df_chk['score'] > min_score)
        & (df_chk['ticket_id'] != placeholder_id)
    )
    matches = df_chk[is_match]
    score = matches['score'].tolist()
    print("Score : ", score)

    # Attach scores by ticket id rather than by position: df_act may be
    # ordered differently from the training matrix, may lack some tickets,
    # or may repeat them. If a ticket id occurs more than once in the
    # training matrix, its highest score is used.
    best_score = matches.groupby('ticket_id', sort=False)['score'].max()
    # .copy() so that adding the column never writes through to df_act.
    df_eval = df_act[df_act['ticket_id'].isin(best_score.index)].copy()
    df_eval['score'] = df_eval['ticket_id'].map(best_score)
    print("DF eval : ", df_eval)

    return df_eval, df_tst