Advertisement
Guest User

Untitled

a guest
Oct 17th, 2019
86
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 0.89 KB | None | 0 0
  1. import numpy as np
  2. import xgboost as xgb
  3. from xgboost import XGBRegressor, DMatrix
  4. import warnings
  5. warnings.filterwarnings('ignore')
  6.  
  7. text_columns = ['query_id', 'region', 'relevance', 'org_id', 'window_center', 'query', 'query_tokens', 'all_text_info', 'org_name']
  8.  
  9. X_train = train_df.drop(text_columns, axis=1)
  10. y_train = train_df['relevance']
  11. queries_train = train_df['query_id'].values
  12. xgtrain = DMatrix(X_train, label=y_train)
  13. xgtrain.set_group(train_df.groupby('relevance').apply(len).values)
  14.  
  15. X_test = test_df.drop(text_columns, axis=1)
  16. y_test = test_df['relevance'].values
  17. queries_test = test_df['query_id'].values
  18. xgtest = DMatrix(X_test, label=y_test)
  19. xgtest.set_group(test_df.groupby('relevance').apply(len).values)
  20.  
  21. bst = xgb.train({
  22. "objective": "rank:pairwise",
  23. "eval_metric": "ndcg@10",
  24. "silent": True
  25. }, xgtrain, num_boost_round=50)
  26.  
  27. print(bst.eval(xgtest))
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement