title={UNet++: Redesigning Skip Connections to Exploit Multiscale Features in Image Segmentation},
author={Zhou, Zongwei and Siddiquee, Md Mahfuzur Rahman and Tajbakhsh, Nima and Liang, Jianming},
journal={IEEE Transactions on Medical Imaging},
volume={39},
number={6},
pages={1856--1867},
year={2020},
}
@dataset{jiang_hou_2021_5171712,
author = {Jiang, Hou and
          Yao, Ling and
          Liu, Yujun},
title = {{Multi-resolution dataset for photovoltaic panel
segmentation from satellite and aerial imagery}},
month = aug,
year = 2021,
note = {{Documentation is available in the preprint at https://essd.copernicus.org/preprints/essd-2021-270/}},
publisher = {Zenodo},
version = {v1.0},
doi = {10.5281/zenodo.5171712},
url = {https://doi.org/10.5281/zenodo.5171712}
}
@article{devlin2018bert,
title={{BERT}: Pre-training of deep bidirectional transformers for language understanding},
author={Devlin, Jacob and Chang, Ming-Wei and Lee, Kenton and Toutanova, Kristina},
journal={arXiv preprint arXiv:1810.04805},
year={2018}
}
@inproceedings{radford2021learning,
title={Learning transferable visual models from natural language supervision},
author={Radford, Alec and Kim, Jong Wook and Hallacy, Chris and Ramesh, Aditya and Goh, Gabriel and Agarwal, Sandhini and Sastry, Girish and Askell, Amanda and Mishkin, Pamela and Clark, Jack and others},
booktitle={International Conference on Machine Learning},
pages={8748--8763},
year={2021},
organization={PMLR}
}
@inproceedings{wang2020large,
title={A large-scale {Chinese} short-text conversation dataset},
author={Wang, Yida and Ke, Pei and Zheng, Yinhe and Huang, Kaili and Jiang, Yong and Zhu, Xiaoyan and Huang, Minlie},
booktitle={CCF International Conference on Natural Language Processing and Chinese Computing},
abstract = "Multi-task learning with transformer encoders (MTL) has emerged as a powerful technique to improve performance on closely-related tasks for both accuracy and efficiency while a question still remains whether or not it would perform as well on tasks that are distinct in nature. We first present MTL results on five NLP tasks, POS, NER, DEP, CON, and SRL, and depict its deficiency over single-task learning. We then conduct an extensive pruning analysis to show that a certain set of attention heads get claimed by most tasks during MTL, who interfere with one another to fine-tune those heads for their own objectives. Based on this finding, we propose the Stem Cell Hypothesis to reveal the existence of attention heads naturally talented for many tasks that cannot be jointly trained to create adequate embeddings for all of those tasks. Finally, we design novel parameter-free probes to justify our hypothesis and demonstrate how attention heads are transformed across the five tasks during MTL through label analysis.",
@inproceedings{yao2021wenet,
title={WeNet: Production Oriented Streaming and Non-streaming End-to-End Speech Recognition Toolkit},
author={Yao, Zhuoyuan and Wu, Di and Wang, Xiong and Zhang, Binbin and Yu, Fan and Yang, Chao and Peng, Zhendong and Chen, Xiaoyu and Xie, Lei and Lei, Xin},