% Generated by IEEEtran.bst, version: 1.14 (2015/08/26)
\begin{thebibliography}{10}
\providecommand{\url}[1]{#1}
\csname url@samestyle\endcsname
\providecommand{\newblock}{\relax}
\providecommand{\bibinfo}[2]{#2}
\providecommand{\BIBentrySTDinterwordspacing}{\spaceskip=0pt\relax}
\providecommand{\BIBentryALTinterwordstretchfactor}{4}
\providecommand{\BIBentryALTinterwordspacing}{\spaceskip=\fontdimen2\font plus
\BIBentryALTinterwordstretchfactor\fontdimen3\font minus
  \fontdimen4\font\relax}
\providecommand{\BIBforeignlanguage}[2]{{%
\expandafter\ifx\csname l@#1\endcsname\relax
\typeout{** WARNING: IEEEtran.bst: No hyphenation pattern has been}%
\typeout{** loaded for the language `#1'. Using the pattern for}%
\typeout{** the default language instead.}%
\else
\language=\csname l@#1\endcsname
\fi
#2}}
\providecommand{\BIBdecl}{\relax}
\BIBdecl

\bibitem{choi2020online}
\BIBentryALTinterwordspacing
H.~Choi, C.~F. Mela, S.~R. Balseiro, and A.~Leary, ``Online display advertising markets: A literature review and future directions,'' \emph{Inf. Syst. Res.}, vol.~31, no.~2, pp. 556--575, 2020.
[Online]. Available: \url{http://dblp.uni-trier.de/db/journals/isr/isr31.html#ChoiMBL20}
\BIBentrySTDinterwordspacing

\bibitem{yuan2014survey}
Y.~Yuan, F.~Wang, J.~Li, and R.~Qin, ``A survey on real time bidding advertising,'' in \emph{Proceedings of 2014 IEEE International Conference on Service Operations and Logistics, and Informatics}, 2014, pp. 418--423.

\bibitem{qin2019revenue}
\BIBentryALTinterwordspacing
R.~Qin, X.~Ni, Y.~Yuan, J.~Li, and F.-Y. Wang, ``Revenue models for demand side platforms in real time bidding advertising,'' in \emph{SMC}.\hskip 1em plus 0.5em minus 0.4em\relax IEEE, 2017, pp. 438--443.
[Online]. Available: \url{http://dblp.uni-trier.de/db/conf/smc/smc2017.html#QinNYLW17}
\BIBentrySTDinterwordspacing

\bibitem{reference/ml/LingS17}
\BIBentryALTinterwordspacing
C.~X. Ling and V.~S.
Sheng, ``Class imbalance problem,'' in \emph{Encyclopedia of Machine Learning and Data Mining}, C.~Sammut and G.~I. Webb, Eds.\hskip 1em plus 0.5em minus 0.4em\relax Springer, 2017, pp. 204--205.
[Online]. Available: \url{http://dblp.uni-trier.de/db/reference/ml/ml2017.html#LingS17}
\BIBentrySTDinterwordspacing

\bibitem{pires2019high}
A.~M. Pires and J.~A. Branco, ``High dimensionality: The latest challenge to data analysis,'' 2019.

\bibitem{journals/eswa/LikaKH14}
\BIBentryALTinterwordspacing
B.~Lika, K.~Kolomvatsos, and S.~Hadjiefthymiades, ``Facing the cold start problem in recommender systems,'' \emph{Expert Syst. Appl.}, vol.~41, no.~4, pp. 2065--2073, 2014.
[Online]. Available: \url{http://dblp.uni-trier.de/db/journals/eswa/eswa41.html#LikaKH14}
\BIBentrySTDinterwordspacing

\bibitem{DBLP:journals/corr/abs-1004-3732}
\BIBentryALTinterwordspacing
Z.~Zhang, C.~Liu, Y.~Zhang, and T.~Zhou, ``Solving the cold-start problem in recommender systems with social tags,'' \emph{CoRR}, vol. abs/1004.3732, 2010.
[Online]. Available: \url{http://arxiv.org/abs/1004.3732}
\BIBentrySTDinterwordspacing

\bibitem{boser1992}
\BIBentryALTinterwordspacing
B.~E. Boser, I.~M. Guyon, and V.~N. Vapnik, ``A training algorithm for optimal margin classifiers,'' in \emph{Proceedings of the 5th Annual Workshop on Computational Learning Theory (COLT'92)}, D.~Haussler, Ed.\hskip 1em plus 0.5em minus 0.4em\relax Pittsburgh, PA, USA: ACM Press, July 1992, pp. 144--152.
[Online]. Available: \url{http://doi.acm.org/10.1145/130385.130401}
\BIBentrySTDinterwordspacing

\bibitem{Gai_piecewise}
\BIBentryALTinterwordspacing
K.~Gai, X.~Zhu, H.~Li, K.~Liu, and Z.~Wang, ``Learning piece-wise linear models from large scale data for ad click prediction,'' \emph{CoRR}, vol. abs/1704.05194, 2017.
[Online].
Available: \url{http://dblp.uni-trier.de/db/journals/corr/corr1704.html#GaiZLLW17}
\BIBentrySTDinterwordspacing

\bibitem{lecun_sgd}
Y.~LeCun, L.~Bottou, Y.~Bengio, and P.~Haffner, ``Gradient-based learning applied to document recognition,'' \emph{Proceedings of the IEEE}, vol.~86, no.~11, pp. 2278--2324, 1998.

\bibitem{lbfgs_2008}
\BIBentryALTinterwordspacing
Y.~Xiao, Z.~Wei, and Z.~Wang, ``A limited memory BFGS-type method for large-scale unconstrained optimization,'' \emph{Comput. Math. Appl.}, vol.~56, no.~4, pp. 1001--1009, 2008.
[Online]. Available: \url{http://dblp.uni-trier.de/db/journals/cma/cma56.html#XiaoWW08}
\BIBentrySTDinterwordspacing

\bibitem{Graepel_2010}
\BIBentryALTinterwordspacing
T.~Graepel, J.~Q. Candela, T.~Borchert, and R.~Herbrich, ``Web-scale Bayesian click-through rate prediction for sponsored search advertising in Microsoft's Bing search engine,'' in \emph{ICML}, J.~F{\"u}rnkranz and T.~Joachims, Eds.\hskip 1em plus 0.5em minus 0.4em\relax Omnipress, 2010, pp. 13--20.
[Online]. Available: \url{http://dblp.uni-trier.de/db/conf/icml/icml2010.html#GraepelCBH10}
\BIBentrySTDinterwordspacing

\bibitem{Rendle:2010ja}
\BIBentryALTinterwordspacing
S.~Rendle, ``{Factorization Machines},'' in \emph{Proceedings of the 2010 IEEE International Conference on Data Mining}, ser. ICDM '10.\hskip 1em plus 0.5em minus 0.4em\relax IEEE, Dec. 2010, pp. 995--1000.
[Online]. Available: \url{http://ieeexplore.ieee.org/document/5694074/}
\BIBentrySTDinterwordspacing

\bibitem{Juan_fieldawarefm1}
\BIBentryALTinterwordspacing
Y.-C. Juan, Y.~Zhuang, W.-S. Chin, and C.-J. Lin, ``Field-aware factorization machines for CTR prediction,'' in \emph{RecSys}, S.~Sen, W.~Geyer, J.~Freyne, and P.~Castells, Eds.\hskip 1em plus 0.5em minus 0.4em\relax ACM, 2016, pp. 43--50.
[Online].
Available: \url{http://dblp.uni-trier.de/db/conf/recsys/recsys2016.html#JuanZCL16}
\BIBentrySTDinterwordspacing

\bibitem{Juan_fieldawarefm2}
\BIBentryALTinterwordspacing
Y.~Juan, D.~Lefortier, and O.~Chapelle, ``Field-aware factorization machines in a real-world online advertising system,'' \emph{CoRR}, vol. abs/1701.04099, 2017.
[Online]. Available: \url{http://dblp.uni-trier.de/db/journals/corr/corr1701.html#JuanLC17}
\BIBentrySTDinterwordspacing

\bibitem{Pan_fieldweightedfm}
\BIBentryALTinterwordspacing
J.~Pan, J.~Xu, A.~L. Ruiz, W.~Zhao, S.~Pan, Y.~Sun, and Q.~Lu, ``Field-weighted factorization machines for click-through rate prediction in display advertising,'' \emph{CoRR}, vol. abs/1806.03514, 2018.
[Online]. Available: \url{http://dblp.uni-trier.de/db/journals/corr/corr1806.html#abs-1806-03514}
\BIBentrySTDinterwordspacing

\bibitem{Freudenthaler2011BayesianFM}
C.~Freudenthaler, L.~Schmidt-Thieme, and S.~Rendle, ``Bayesian factorization machines,'' in \emph{Proceedings of the NIPS Workshop on Sparse Representation and Low-rank Approximation}, 2011.

\bibitem{Pan_sparsefm}
\BIBentryALTinterwordspacing
Z.~Pan, E.~Chen, Q.~Liu, T.~Xu, H.~Ma, and H.~Lin, ``Sparse factorization machines for click-through rate prediction,'' in \emph{ICDM}, F.~Bonchi, J.~Domingo-Ferrer, R.~Baeza-Yates, Z.-H. Zhou, and X.~Wu, Eds.\hskip 1em plus 0.5em minus 0.4em\relax IEEE Computer Society, 2016, pp. 400--409.
[Online]. Available: \url{http://dblp.uni-trier.de/db/conf/icdm/icdm2016.html#PanCLXML16}
\BIBentrySTDinterwordspacing

\bibitem{Xiao_afm}
\BIBentryALTinterwordspacing
J.~Xiao, H.~Ye, X.~He, H.~Zhang, F.~Wu, and T.-S. Chua, ``Attentional factorization machines: Learning the weight of feature interactions via attention networks,'' \emph{CoRR}, vol. abs/1708.04617, 2017.
[Online].
Available: \url{http://dblp.uni-trier.de/db/journals/corr/corr1708.html#abs-1708-04617}
\BIBentrySTDinterwordspacing

\bibitem{srivastava2014dropout}
\BIBentryALTinterwordspacing
N.~Srivastava, G.~Hinton, A.~Krizhevsky, I.~Sutskever, and R.~Salakhutdinov, ``{Dropout: A Simple Way to Prevent Neural Networks from Overfitting},'' \emph{J. Mach. Learn. Res.}, vol.~15, no.~1, pp. 1929--1958, Jan. 2014.
[Online]. Available: \url{http://portal.acm.org/citation.cfm?id=2670313}
\BIBentrySTDinterwordspacing

\bibitem{tikhonov1943stability}
A.~N. Tikhonov, ``On the stability of inverse problems,'' in \emph{Dokl. Akad. Nauk SSSR}, vol.~39, 1943, pp. 195--198.

\bibitem{journals/corr/ZhangYS17aa}
\BIBentryALTinterwordspacing
S.~Zhang, L.~Yao, and A.~Sun, ``Deep learning based recommender system: A survey and new perspectives,'' \emph{CoRR}, vol. abs/1707.07435, 2017.
[Online]. Available: \url{http://dblp.uni-trier.de/db/journals/corr/corr1707.html#ZhangYS17aa}
\BIBentrySTDinterwordspacing

\bibitem{Chen_deepctr}
\BIBentryALTinterwordspacing
J.~Chen, B.~Sun, H.~Li, H.~Lu, and X.-S. Hua, ``Deep CTR prediction in display advertising,'' in \emph{ACM Multimedia}, A.~Hanjalic, C.~Snoek, M.~Worring, D.~C.~A. Bulterman, B.~Huet, A.~Kelliher, Y.~Kompatsiaris, and J.~Li, Eds.\hskip 1em plus 0.5em minus 0.4em\relax ACM, 2016, pp. 811--820.
[Online]. Available: \url{http://dblp.uni-trier.de/db/conf/mm/mm2016.html#ChenSLLH16}
\BIBentrySTDinterwordspacing

\bibitem{he2015residual}
\BIBentryALTinterwordspacing
K.~He, X.~Zhang, S.~Ren, and J.~Sun, ``Deep residual learning for image recognition,'' 2015, arXiv:1512.03385, Tech report.
[Online]. Available: \url{http://arxiv.org/abs/1512.03385}
\BIBentrySTDinterwordspacing

\bibitem{Nair_relu}
\BIBentryALTinterwordspacing
V.~Nair and G.~E. Hinton, ``Rectified linear units improve restricted Boltzmann machines,'' in \emph{ICML}, J.~F{\"u}rnkranz and T.~Joachims, Eds.\hskip 1em plus 0.5em minus 0.4em\relax Omnipress, 2010, pp. 807--814.
[Online].
Available: \url{http://dblp.uni-trier.de/db/conf/icml/icml2010.html#NairH10}
\BIBentrySTDinterwordspacing

\bibitem{Guo_embedding_2016}
\BIBentryALTinterwordspacing
C.~Guo and F.~Berkhahn, ``Entity embeddings of categorical variables,'' \emph{CoRR}, vol. abs/1604.06737, 2016.
[Online]. Available: \url{http://dblp.uni-trier.de/db/journals/corr/corr1604.html#GuoB16}
\BIBentrySTDinterwordspacing

\bibitem{ioffe2015batch}
\BIBentryALTinterwordspacing
S.~Ioffe and C.~Szegedy, ``Batch normalization: Accelerating deep network training by reducing internal covariate shift,'' 2015, arXiv:1502.03167.
[Online]. Available: \url{http://arxiv.org/abs/1502.03167}
\BIBentrySTDinterwordspacing

\bibitem{Guo_deepfm1}
\BIBentryALTinterwordspacing
H.~Guo, R.~Tang, Y.~Ye, Z.~Li, and X.~He, ``DeepFM: A factorization-machine based neural network for CTR prediction,'' in \emph{IJCAI}, C.~Sierra, Ed.\hskip 1em plus 0.5em minus 0.4em\relax ijcai.org, 2017, pp. 1725--1731.
[Online]. Available: \url{http://dblp.uni-trier.de/db/conf/ijcai/ijcai2017.html#GuoTYLH17}
\BIBentrySTDinterwordspacing

\bibitem{Guo_deepfm2}
\BIBentryALTinterwordspacing
H.~Guo, R.~Tang, Y.~Ye, Z.~Li, X.~He, and Z.~Dong, ``DeepFM: An end-to-end wide and deep learning framework for CTR prediction,'' \emph{CoRR}, vol. abs/1804.04950, 2018.
[Online]. Available: \url{http://dblp.uni-trier.de/db/journals/corr/corr1804.html#abs-1804-04950}
\BIBentrySTDinterwordspacing

\bibitem{Cheng_wideanddeep}
\BIBentryALTinterwordspacing
H.-T. Cheng, L.~Koc, J.~Harmsen, T.~Shaked, T.~Chandra, H.~Aradhye, G.~Anderson, G.~Corrado, W.~Chai, M.~Ispir, R.~Anil, Z.~Haque, L.~Hong, V.~Jain, X.~Liu, and H.~Shah, ``Wide and deep learning for recommender systems,'' in \emph{DLRS@RecSys}, A.~Karatzoglou, B.~Hidasi, D.~Tikk, O.~S. Shalom, H.~Roitman, B.~Shapira, and L.~Rokach, Eds.\hskip 1em plus 0.5em minus 0.4em\relax ACM, 2016, pp. 7--10.
[Online].
Available: \url{http://dblp.uni-trier.de/db/conf/recsys/dlrs2016.html#Cheng0HSCAACCIA16}
\BIBentrySTDinterwordspacing

\bibitem{Wang_asae}
\BIBentryALTinterwordspacing
Q.~Wang, F.~Liu, S.~Xing, and X.~Zhao, ``A new approach for advertising CTR prediction based on deep neural network via attention mechanism,'' \emph{Comput. Math. Methods Medicine}, vol. 2018, pp. 8056541:1--8056541:11, 2018.
[Online]. Available: \url{http://dblp.uni-trier.de/db/journals/cmmm/cmmm2018.html#WangLXZ18}
\BIBentrySTDinterwordspacing

\bibitem{Ballard_autoencoder}
\BIBentryALTinterwordspacing
D.~H. Ballard, ``Modular learning in neural networks,'' in \emph{AAAI}, K.~D. Forbus and H.~E. Shrobe, Eds.\hskip 1em plus 0.5em minus 0.4em\relax Morgan Kaufmann, 1987, pp. 279--284.
[Online]. Available: \url{http://dblp.uni-trier.de/db/conf/aaai/aaai87.html#Ballard87}
\BIBentrySTDinterwordspacing

\bibitem{ShannonWeaver49}
C.~E. Shannon and W.~Weaver, \emph{The Mathematical Theory of Communication}.\hskip 1em plus 0.5em minus 0.4em\relax Urbana and Chicago: University of Illinois Press, 1949.

\bibitem{Naumov_embedding_dim}
\BIBentryALTinterwordspacing
M.~Naumov, ``On the dimensionality of embeddings for sparse features and data,'' \emph{CoRR}, vol. abs/1901.02103, 2019.
[Online]. Available: \url{http://dblp.uni-trier.de/db/journals/corr/corr1901.html#abs-1901-02103}
\BIBentrySTDinterwordspacing

\bibitem{Ginart_MixedDimEmb}
\BIBentryALTinterwordspacing
A.~Ginart, M.~Naumov, D.~Mudigere, J.~Yang, and J.~Zou, ``Mixed dimension embeddings with application to memory-efficient recommendation systems,'' \emph{CoRR}, vol. abs/1909.11810, 2019.
[Online]. Available: \url{http://dblp.uni-trier.de/db/journals/corr/corr1909.html#abs-1909-11810}
\BIBentrySTDinterwordspacing

\bibitem{he2017neural}
\BIBentryALTinterwordspacing
X.~He, L.~Liao, H.~Zhang, L.~Nie, X.~Hu, and T.-S. Chua, ``Neural collaborative filtering,'' in \emph{Proceedings of the 26th International Conference on World Wide Web}, ser.
WWW '17.\hskip 1em plus 0.5em minus 0.4em\relax Republic and Canton of Geneva, CHE: International World Wide Web Conferences Steering Committee, 2017, pp. 173--182.
[Online]. Available: \url{https://doi.org/10.1145/3038912.3052569}
\BIBentrySTDinterwordspacing

\bibitem{maas2013leakyrelu}
A.~L. Maas, A.~Y. Hannun, and A.~Y. Ng, ``Rectifier nonlinearities improve neural network acoustic models,'' in \emph{Proc. ICML}, vol.~30, no.~1.\hskip 1em plus 0.5em minus 0.4em\relax Citeseer, 2013, p.~3.

\bibitem{t-sne}
\BIBentryALTinterwordspacing
L.~van~der Maaten and G.~Hinton, ``Visualizing data using {t-SNE},'' \emph{Journal of Machine Learning Research}, vol.~9, pp. 2579--2605, 2008.
[Online]. Available: \url{http://www.jmlr.org/papers/v9/vandermaaten08a.html}
\BIBentrySTDinterwordspacing

\end{thebibliography}