Notice: this service is provided by indexloc; do not enter any passwords.

BibTeX records: Zhao Song 0002

download as .bib file

@article{DBLP:journals/siamcomp/RubinsteinSSS25,
  author       = {Aviad Rubinstein and
                  Saeed Seddighin and
                  Zhao Song and
                  Xiaorui Sun},
  title        = {Approximation Algorithms for {LCS} and {LIS} with Truly Improved Running
                  Times},
  journal      = {{SIAM} J. Comput.},
  volume       = {54},
  number       = {4},
  pages        = {S19-276},
  year         = {2025},
  internal-note = {pages: "S19-276" looks like a single special-section page
                  identifier rather than a range from S19 to 276, so the range
                  dash was removed. TODO confirm the full page span with the
                  publisher.}
}
@inproceedings{DBLP:conf/aaai/Shen000L000KDS025,
  author       = {Xuan Shen and
                  Zhao Song and
                  Yufa Zhou and
                  Bo Chen and
                  Yanyu Li and
                  Yifan Gong and
                  Kai Zhang and
                  Hao Tan and
                  Jason Kuen and
                  Henghui Ding and
                  Zhihao Shu and
                  Wei Niu and
                  Pu Zhao and
                  Yanzhi Wang and
                  Jiuxiang Gu},
  title        = {{LazyDiT}: Lazy Learning for the Acceleration of Diffusion Transformers},
  booktitle    = {{AAAI}},
  pages        = {20409--20417},
  publisher    = {{AAAI} Press},
  year         = {2025}
}
@inproceedings{DBLP:conf/aaai/Shen000L0R00CZ025,
  author    = {Shen, Xuan and Song, Zhao and Zhou, Yufa and Chen, Bo and
               Liu, Jing and Zhang, Ruiyi and Rossi, Ryan A. and Tan, Hao and
               Yu, Tong and Chen, Xiang and Zhou, Yufan and Sun, Tong and
               Zhao, Pu and Wang, Yanzhi and Gu, Jiuxiang},
  title     = {Numerical Pruning for Efficient Autoregressive Models},
  booktitle = {{AAAI}},
  pages     = {20418--20426},
  publisher = {{AAAI} Press},
  year      = {2025},
}
@inproceedings{DBLP:conf/aistats/LiLSSZ25,
  author       = {Chenyang Li and
                  Yingyu Liang and
                  Zhenmei Shi and
                  Zhao Song and
                  Tianyi Zhou},
  title        = {{Fourier} Circuits in Neural Networks and Transformers: {A} Case Study
                  of Modular Arithmetic with Multiple Inputs},
  booktitle    = {{AISTATS}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {258},
  pages        = {523--531},
  publisher    = {{PMLR}},
  year         = {2025}
}
@inproceedings{DBLP:conf/aistats/GaoSY25,
  author    = {Gao, Yeqi and Song, Zhao and Yin, Junze},
  title     = {An Iterative Algorithm for Rescaled Hyperbolic Functions Regression},
  booktitle = {{AISTATS}},
  series    = {Proceedings of Machine Learning Research},
  volume    = {258},
  pages     = {2548--2556},
  publisher = {{PMLR}},
  year      = {2025},
}
@inproceedings{DBLP:conf/aistats/LiangSSSZ25,
  author       = {Yingyu Liang and
                  Zhizhou Sha and
                  Zhenmei Shi and
                  Zhao Song and
                  Yufa Zhou},
  title        = {Looped {ReLU} {MLPs} May Be All You Need as Practical Programmable Computers},
  booktitle    = {{AISTATS}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {258},
  pages        = {2647--2655},
  publisher    = {{PMLR}},
  year         = {2025}
}
@inproceedings{DBLP:conf/aistats/LiLSS25,
  author    = {Li, Chenyang and Liang, Yingyu and Shi, Zhenmei and Song, Zhao},
  title     = {When Can We Solve the Weighted Low Rank Approximation Problem
               in Truly Subquadratic Time?},
  booktitle = {{AISTATS}},
  series    = {Proceedings of Machine Learning Research},
  volume    = {258},
  pages     = {2710--2718},
  publisher = {{PMLR}},
  year      = {2025},
}
@inproceedings{DBLP:conf/aistats/ChenLLSS25,
  author    = {Chen, Bo and Li, Xiaoyu and Liang, Yingyu and Shi, Zhenmei and
               Song, Zhao},
  title     = {Bypassing the Exponential Dependency: Looped Transformers
               Efficiently Learn In-context by Multi-step Gradient Descent},
  booktitle = {{AISTATS}},
  series    = {Proceedings of Machine Learning Research},
  volume    = {258},
  pages     = {4447--4455},
  publisher = {{PMLR}},
  year      = {2025},
}
@inproceedings{DBLP:conf/cpal/LiLSSY25,
  author       = {Xiaoyu Li and
                  Yingyu Liang and
                  Zhenmei Shi and
                  Zhao Song and
                  Junwei Yu},
  title        = {Fast {John} Ellipsoid Computation with Differential Privacy Optimization},
  booktitle    = {{CPAL}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {280},
  pages        = {24--64},
  publisher    = {{PMLR}},
  year         = {2025}
}
@inproceedings{DBLP:conf/cpal/ChenLSSS25,
  author       = {Bo Chen and
                  Yingyu Liang and
                  Zhizhou Sha and
                  Zhenmei Shi and
                  Zhao Song},
  title        = {{HSR}-Enhanced Sparse Attention Acceleration},
  booktitle    = {{CPAL}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {280},
  pages        = {105--133},
  publisher    = {{PMLR}},
  year         = {2025}
}
@inproceedings{DBLP:conf/cpal/DaliriSY25,
  author    = {Daliri, Majid and Song, Zhao and Yang, Chiwun},
  title     = {Unlock the Theory behind Scaling 1-bit Neural Networks},
  booktitle = {{CPAL}},
  series    = {Proceedings of Machine Learning Research},
  volume    = {280},
  pages     = {545--598},
  publisher = {{PMLR}},
  year      = {2025},
}
@inproceedings{DBLP:conf/cpal/KeLSSY25,
  author    = {Ke, Yekun and Liang, Yingyu and Shi, Zhenmei and Song, Zhao and
               Yang, Chiwun},
  title     = {Curse of Attention: {A} Kernel-Based Perspective for Why
               Transformers Fail to Generalize on Time Series Forecasting
               and Beyond},
  booktitle = {{CPAL}},
  series    = {Proceedings of Machine Learning Research},
  volume    = {280},
  pages     = {675--738},
  publisher = {{PMLR}},
  year      = {2025},
}
@inproceedings{DBLP:conf/cpal/ChenLLSS25,
  author       = {Yifang Chen and
                  Xiaoyu Li and
                  Yingyu Liang and
                  Zhenmei Shi and
                  Zhao Song},
  title        = {The Computational Limits of State-Space Models and {Mamba} via the Lens
                  of Circuit Complexity},
  booktitle    = {{CPAL}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {280},
  pages        = {739--767},
  publisher    = {{PMLR}},
  year         = {2025}
}
@inproceedings{DBLP:conf/cpal/SongWYY25,
  author    = {Song, Zhao and Wang, Weixin and Yin, Chenbo and Yin, Junze},
  title     = {Fast and Efficient Matching Algorithm with Deadline Instances},
  booktitle = {{CPAL}},
  series    = {Proceedings of Machine Learning Research},
  volume    = {280},
  pages     = {932--959},
  publisher = {{PMLR}},
  year      = {2025},
}
@inproceedings{DBLP:conf/cpal/DengLSWZ25,
  author    = {Deng, Yichuan and Long, Jiangxuan and Song, Zhao and
               Wang, Zifan and Zhang, Han},
  title     = {Streaming Kernel {PCA} Algorithm With Small Space},
  booktitle = {{CPAL}},
  series    = {Proceedings of Machine Learning Research},
  volume    = {280},
  pages     = {1216--1254},
  publisher = {{PMLR}},
  year      = {2025},
}
@inproceedings{DBLP:conf/iclr/0002YY025,
  author    = {Song, Zhao and Ye, Mingquan and Yin, Junze and Zhang, Lichen},
  title     = {Efficient Alternating Minimization with Applications to
               Weighted Low Rank Approximation},
  booktitle = {{ICLR}},
  publisher = {OpenReview.net},
  year      = {2025},
}
@inproceedings{DBLP:conf/iclr/Gu0025,
  author    = {Gu, Yuzhou and Song, Zhao and Zhang, Lichen},
  title     = {Faster Algorithms for Structured Linear and Kernel Support
               Vector Machines},
  booktitle = {{ICLR}},
  publisher = {OpenReview.net},
  year      = {2025},
}
@inproceedings{DBLP:conf/iclr/HuSK0025,
  author       = {Jerry Yao{-}Chieh Hu and
                  Maojiang Su and
                  En{-}Jui Kuo and
                  Zhao Song and
                  Han Liu},
  title        = {Computational Limits of Low-Rank Adaptation ({LoRA}) Fine-Tuning for
                  Transformer Models},
  booktitle    = {{ICLR}},
  publisher    = {OpenReview.net},
  year         = {2025}
}
@inproceedings{DBLP:conf/iclr/HuWGL0025,
  author    = {Hu, Jerry Yao{-}Chieh and Wang, Wei{-}Po and Gilani, Ammar and
               Li, Chenyang and Song, Zhao and Liu, Han},
  title     = {Fundamental Limits of Prompt Tuning Transformers: Universality,
               Capacity and Efficiency},
  booktitle = {{ICLR}},
  publisher = {OpenReview.net},
  year      = {2025},
}
@inproceedings{DBLP:conf/iclr/LiangLS0025,
  author    = {Liang, Yingyu and Long, Jiangxuan and Shi, Zhenmei and
               Song, Zhao and Zhou, Yufa},
  title     = {Beyond Linear Approximations: {A} Novel Pruning Approach for
               Attention Matrix},
  booktitle = {{ICLR}},
  publisher = {OpenReview.net},
  year      = {2025},
}
@inproceedings{DBLP:conf/uai/ChenGLLSSSWY25,
  author       = {Bo Chen and
                  Chengyue Gong and
                  Xiaoyu Li and
                  Yingyu Liang and
                  Zhizhou Sha and
                  Zhenmei Shi and
                  Zhao Song and
                  Mingda Wan and
                  Xugang Ye},
  title        = {{NRFlow}: Towards Noise-Robust Generative Modeling via High-Order Mechanism},
  booktitle    = {{UAI}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {286},
  pages        = {673--704},
  publisher    = {{PMLR}},
  year         = {2025}
}
@inproceedings{DBLP:conf/uai/GaoSWY25,
  author    = {Gao, Yeqi and Song, Zhao and Wang, Weixin and Yin, Junze},
  title     = {A Fast Optimization View: Reformulating Single Layer Attention
               in {LLM} Based on Tensor and {SVM} Trick, and Solving It in
               Matrix Multiplication Time},
  booktitle = {{UAI}},
  series    = {Proceedings of Machine Learning Research},
  volume    = {286},
  pages     = {1381--1452},
  publisher = {{PMLR}},
  year      = {2025},
}
@inproceedings{DBLP:conf/uai/LiangSXYZ25,
  author    = {Liang, Jiehao and Song, Zhao and Xu, Zhaozhuo and Yin, Junze and
               Zhuo, Danyang},
  title     = {Dynamic Maintenance of Kernel Density Estimation Data
               Structure: From Practice to Theory},
  booktitle = {{UAI}},
  series    = {Proceedings of Machine Learning Research},
  volume    = {286},
  pages     = {2552--2581},
  publisher = {{PMLR}},
  year      = {2025},
}
@inproceedings{DBLP:conf/wacv/GuLSS025,
  author    = {Gu, Jiuxiang and Liang, Yingyu and Sha, Zhizhou and
               Shi, Zhenmei and Song, Zhao},
  title     = {Differential Privacy Mechanisms in Neural Tangent Kernel Regression},
  booktitle = {{WACV}},
  pages     = {2342--2356},
  publisher = {{IEEE}},
  year      = {2025},
}
@article{DBLP:journals/corr/abs-2501-04299,
  author       = {Yekun Ke and
                  Xiaoyu Li and
                  Yingyu Liang and
                  Zhenmei Shi and
                  Zhao Song},
  title        = {Circuit Complexity Bounds for Visual Autoregressive Model},
  journal      = {CoRR},
  volume       = {abs/2501.04299},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2501.04299}
}
@article{DBLP:journals/corr/abs-2501-04377,
  author       = {Yekun Ke and
                  Xiaoyu Li and
                  Yingyu Liang and
                  Zhizhou Sha and
                  Zhenmei Shi and
                  Zhao Song},
  title        = {On Computational Limits and Provably Efficient Criteria of Visual
                  Autoregressive Models: {A} Fine-Grained Complexity Analysis},
  journal      = {CoRR},
  volume       = {abs/2501.04377},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2501.04377}
}
@article{DBLP:journals/corr/abs-2501-05884,
  author       = {Dabing Cheng and
                  Haosen Zhan and
                  Xingchen Zhao and
                  Guisheng Liu and
                  Zemin Li and
                  Jinghui Xie and
                  Zhao Song and
                  Weiguo Feng and
                  Bingyue Peng},
  title        = {{Text-to-Edit}: Controllable End-to-End Video Ad Creation via Multimodal
                  {LLMs}},
  journal      = {CoRR},
  volume       = {abs/2501.05884},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2501.05884}
}
@article{DBLP:journals/corr/abs-2501-06444,
  author       = {Xiaoyu Li and
                  Yingyu Liang and
                  Zhenmei Shi and
                  Zhao Song and
                  Wei Wang and
                  Jiahao Zhang},
  title        = {On the Computational Capability of Graph Neural Networks: {A} Circuit
                  Complexity Bound Perspective},
  journal      = {CoRR},
  volume       = {abs/2501.06444},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2501.06444}
}
@article{DBLP:journals/corr/abs-2501-09982,
  author       = {Yuefan Cao and
                  Chengyue Gong and
                  Xiaoyu Li and
                  Yingyu Liang and
                  Zhizhou Sha and
                  Zhenmei Shi and
                  Zhao Song},
  title        = {{RichSpace}: Enriching Text-to-Video Prompt Space via Text Embedding
                  Interpolation},
  journal      = {CoRR},
  volume       = {abs/2501.09982},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2501.09982}
}
@article{DBLP:journals/corr/abs-2501-10688,
  author       = {Xiaoyu Li and
                  Yingyu Liang and
                  Jiangxuan Long and
                  Zhenmei Shi and
                  Zhao Song and
                  Zhen Zhuang},
  title        = {Neural Algorithmic Reasoning for Hypergraphs with Looped Transformers},
  journal      = {CoRR},
  volume       = {abs/2501.10688},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2501.10688}
}
@article{DBLP:journals/corr/abs-2502-00500,
  author       = {Yang Cao and
                  Zhao Song and
                  Chiwun Yang},
  title        = {Video Latent Flow Matching: Optimal Polynomial Projections for Video
                  Interpolation and Extrapolation},
  journal      = {CoRR},
  volume       = {abs/2502.00500},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2502.00500}
}
@article{DBLP:journals/corr/abs-2502-00688,
  author       = {Bo Chen and
                  Chengyue Gong and
                  Xiaoyu Li and
                  Yingyu Liang and
                  Zhizhou Sha and
                  Zhenmei Shi and
                  Zhao Song and
                  Mingda Wan},
  title        = {High-Order Matching for One-Step Shortcut Diffusion Models},
  journal      = {CoRR},
  volume       = {abs/2502.00688},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2502.00688}
}
@article{DBLP:journals/corr/abs-2502-00690,
  author       = {Yuefan Cao and
                  Xiaoyu Li and
                  Yingyu Liang and
                  Zhizhou Sha and
                  Zhenmei Shi and
                  Zhao Song and
                  Jiahao Zhang},
  title        = {Dissecting Submission Limit in Desk-Rejections: {A} Mathematical Analysis
                  of Fairness in {AI} Conference Policies},
  journal      = {CoRR},
  volume       = {abs/2502.00690},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2502.00690}
}
@article{DBLP:journals/corr/abs-2502-00693,
  author       = {Yekun Ke and
                  Yingyu Liang and
                  Zhizhou Sha and
                  Zhenmei Shi and
                  Zhao Song},
  title        = {{DPBloomfilter}: Securing {Bloom} Filters with Differential Privacy},
  journal      = {CoRR},
  volume       = {abs/2502.00693},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2502.00693}
}
@article{DBLP:journals/corr/abs-2502-06167,
  author       = {Yifang Chen and
                  Xiaoyu Li and
                  Yingyu Liang and
                  Zhenmei Shi and
                  Zhao Song},
  title        = {Universal Approximation of Visual Autoregressive Transformers},
  journal      = {CoRR},
  volume       = {abs/2502.06167},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2502.06167}
}
@article{DBLP:journals/corr/abs-2502-08150,
  author       = {Yang Cao and
                  Bo Chen and
                  Xiaoyu Li and
                  Yingyu Liang and
                  Zhizhou Sha and
                  Zhenmei Shi and
                  Zhao Song and
                  Mingda Wan},
  title        = {Force Matching with Relativistic Constraints: {A} Physics-Inspired
                  Approach to Stable and Efficient Generative Modeling},
  journal      = {CoRR},
  volume       = {abs/2502.08150},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2502.08150}
}
@article{DBLP:journals/corr/abs-2502-16490,
  author       = {Chengyue Gong and
                  Yekun Ke and
                  Xiaoyu Li and
                  Yingyu Liang and
                  Zhizhou Sha and
                  Zhenmei Shi and
                  Zhao Song},
  title        = {On Computational Limits of {FlowAR} Models: Expressivity and Efficiency},
  journal      = {CoRR},
  volume       = {abs/2502.16490},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2502.16490}
}
@article{DBLP:journals/corr/abs-2502-16912,
  author       = {Chenyang Li and
                  Yingyu Liang and
                  Zhenmei Shi and
                  Zhao Song},
  title        = {When Can We Solve the Weighted Low Rank Approximation Problem in Truly
                  Subquadratic Time?},
  journal      = {CoRR},
  volume       = {abs/2502.16912},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2502.16912},
  internal-note = {Same authors and title as DBLP:conf/aistats/LiLSS25;
                  presumably the preprint of that paper -- TODO confirm and
                  avoid citing both.}
}
@article{DBLP:journals/corr/abs-2503-01314,
  author       = {Yifang Chen and
                  Xuyang Guo and
                  Xiaoyu Li and
                  Yingyu Liang and
                  Zhenmei Shi and
                  Zhao Song},
  title        = {Scaling Law Phenomena Across Regression Paradigms: Multiple and Kernel
                  Approaches},
  journal      = {CoRR},
  volume       = {abs/2503.01314},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2503.01314}
}
@article{DBLP:journals/corr/abs-2503-06884,
  author       = {Yuefan Cao and
                  Xuyang Guo and
                  Jiayan Huo and
                  Yingyu Liang and
                  Zhenmei Shi and
                  Zhao Song and
                  Jiahao Zhang and
                  Zhen Zhuang},
  title        = {Text-to-Image Diffusion Models Cannot Count, and Prompt Refinement
                  Cannot Help},
  journal      = {CoRR},
  volume       = {abs/2503.06884},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2503.06884}
}
@article{DBLP:journals/corr/abs-2503-08032,
  author       = {Yingyu Liang and
                  Zhizhou Sha and
                  Zhenmei Shi and
                  Zhao Song and
                  Mingda Wan},
  title        = {{HOFAR:} High-Order Augmentation of Flow Autoregressive Transformers},
  journal      = {CoRR},
  volume       = {abs/2503.08032},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2503.08032}
}
@article{DBLP:journals/corr/abs-2503-09069,
  author       = {Chengyue Gong and
                  Xiaoyu Li and
                  Yingyu Liang and
                  Jiangxuan Long and
                  Zhenmei Shi and
                  Zhao Song and
                  Yu Tian},
  title        = {Theoretical Guarantees for High Order Trajectory Refinement in Generative
                  Flows},
  journal      = {CoRR},
  volume       = {abs/2503.09069},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2503.09069}
}
@article{DBLP:journals/corr/abs-2503-11108,
  author       = {Yifang Chen and
                  Xiaoyu Li and
                  Yingyu Liang and
                  Zhenmei Shi and
                  Zhao Song and
                  Yu Tian},
  title        = {Time and Memory Trade-off of {KV}-Cache Compression in Tensor Transformer
                  Decoding},
  journal      = {CoRR},
  volume       = {abs/2503.11108},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2503.11108}
}
@article{DBLP:journals/corr/abs-2503-14076,
  author       = {Jiangxuan Long and
                  Zhao Song and
                  Chiwun Yang},
  title        = {Theoretical Foundation of Flow-Based Time Series Generation: Provable
                  Approximation, Generalization, and Efficiency},
  journal      = {CoRR},
  volume       = {abs/2503.14076},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2503.14076}
}
@article{DBLP:journals/corr/abs-2503-14881,
  author       = {Bo Chen and
                  Xiaoyu Li and
                  Yekun Ke and
                  Yingyu Liang and
                  Zhenmei Shi and
                  Zhao Song},
  title        = {Exploring the Limits of {KV} Cache Compression in Visual Autoregressive
                  Transformers},
  journal      = {CoRR},
  volume       = {abs/2503.14881},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2503.14881}
}
@article{DBLP:journals/corr/abs-2504-04051,
  author       = {Xuyang Guo and
                  Zekai Huang and
                  Jiayan Huo and
                  Yingyu Liang and
                  Zhenmei Shi and
                  Zhao Song and
                  Jiahao Zhang},
  title        = {Can You Count to Nine? {A} Human Evaluation Benchmark for Counting
                  Limits in Modern Text-to-Video Models},
  journal      = {CoRR},
  volume       = {abs/2504.04051},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2504.04051}
}
@article{DBLP:journals/corr/abs-2504-04702,
  author       = {Bo Chen and
                  Zhenmei Shi and
                  Zhao Song and
                  Jiahao Zhang},
  title        = {Provable Failure of Language Models in Learning Majority {Boolean} Logic
                  via Gradient Descent},
  journal      = {CoRR},
  volume       = {abs/2504.04702},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2504.04702}
}
@article{DBLP:journals/corr/abs-2504-08542,
  author       = {Haoran Cheng and
                  Qide Dong and
                  Liang Peng and
                  Zhizhou Sha and
                  Weiguo Feng and
                  Jinghui Xie and
                  Zhao Song and
                  Shilei Wen and
                  Xiaofei He and
                  Boxi Wu},
  title        = {Discriminator-Free Direct Preference Optimization for Video Diffusion},
  journal      = {CoRR},
  volume       = {abs/2504.08542},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2504.08542}
}
@article{DBLP:journals/corr/abs-2504-19901,
  author       = {Hude Liu and
                  Jerry Yao{-}Chieh Hu and
                  Zhao Song and
                  Han Liu},
  title        = {Attention Mechanism, Max-Affine Partition, and Universal Approximation},
  journal      = {CoRR},
  volume       = {abs/2504.19901},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2504.19901}
}
@article{DBLP:journals/corr/abs-2505-00337,
  author       = {Xuyang Guo and
                  Jiayan Huo and
                  Zhenmei Shi and
                  Zhao Song and
                  Jiahao Zhang and
                  Jiale Zhao},
  title        = {{T2VPhysBench}: {A} First-Principles Benchmark for Physical Consistency
                  in Text-to-Video Generation},
  journal      = {CoRR},
  volume       = {abs/2505.00337},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2505.00337}
}
@article{DBLP:journals/corr/abs-2505-04946,
  author       = {Xuyang Guo and
                  Jiayan Huo and
                  Zhenmei Shi and
                  Zhao Song and
                  Jiahao Zhang and
                  Jiale Zhao},
  title        = {{T2VTextBench}: {A} Human Evaluation Benchmark for Textual Control in
                  Video Generation Models},
  journal      = {CoRR},
  volume       = {abs/2505.04946},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2505.04946}
}
@article{DBLP:journals/corr/abs-2505-11892,
  author       = {Josh Alman and
                  Zhao Song},
  title        = {Fast {RoPE} Attention: Combining the Polynomial Method and Fast {Fourier}
                  Transform},
  journal      = {CoRR},
  volume       = {abs/2505.11892},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2505.11892}
}
@article{DBLP:journals/corr/abs-2505-16284,
  author       = {Josh Alman and
                  Zhao Song},
  title        = {Only Large Weights (And Not Skip Connections) Can Prevent the Perils
                  of Rank Collapse},
  journal      = {CoRR},
  volume       = {abs/2505.16284},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2505.16284}
}
@article{DBLP:journals/corr/abs-2505-19531,
  author       = {Jerry Yao{-}Chieh Hu and
                  Xiwen Zhang and
                  Maojiang Su and
                  Zhao Song and
                  Han Liu},
  title        = {Minimalist Softmax Attention Provably Learns Constrained {Boolean} Functions},
  journal      = {CoRR},
  volume       = {abs/2505.19531},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2505.19531}
}
@article{DBLP:journals/corr/abs-2506-05503,
  author       = {Shiyuan Feng and
                  Ying Feng and
                  George Z. Li and
                  Zhao Song and
                  David P. Woodruff and
                  Lichen Zhang},
  title        = {On Differential Privacy for Adaptively Solving Search Problems via
                  Sketching},
  journal      = {CoRR},
  volume       = {abs/2506.05503},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2506.05503}
}
@article{DBLP:journals/corr/abs-2506-20141,
  author       = {Xiaoyu Li and
                  Zhao Song and
                  Jiahao Zhang},
  title        = {Accept More, Reject Less: Reducing up to 19{\%} Unnecessary Desk-Rejections
                  over 11 Years of {ICLR} Data},
  journal      = {CoRR},
  volume       = {abs/2506.20141},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2506.20141}
}
@article{DBLP:journals/corr/abs-2507-17699,
  author       = {Zhao Song and
                  Song Yue and
                  Jiahao Zhang},
  title        = {Thinking Isn't an Illusion: Overcoming the Limitations of Reasoning
                  Models via Tool Augmentations},
  journal      = {CoRR},
  volume       = {abs/2507.17699},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2507.17699}
}
@article{DBLP:journals/corr/abs-2507-18107,
  author       = {Yubin Chen and
                  Xuyang Guo and
                  Zhenmei Shi and
                  Zhao Song and
                  Jiahao Zhang},
  title        = {{T2VWorldBench}: {A} Benchmark for Evaluating World Knowledge in Text-to-Video
                  Generation},
  journal      = {CoRR},
  volume       = {abs/2507.18107},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2507.18107}
}
@article{DBLP:journals/corr/abs-2508-06004,
  author       = {Weihang Guo and
                  Zhao Song and
                  Jiahao Zhang},
  title        = {When a Paper Has 1000 Authors: Rethinking Citation Metrics in the
                  Era of {LLMs}},
  journal      = {CoRR},
  volume       = {abs/2508.06004},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2508.06004}
}
@article{DBLP:journals/corr/abs-2508-07102,
  author       = {Yang Cao and
                  Yubin Chen and
                  Zhao Song and
                  Jiahao Zhang},
  title        = {Towards High-Order Mean Flow Generative Models: Feasibility, Expressivity,
                  and Provably Efficient Criteria},
  journal      = {CoRR},
  volume       = {abs/2508.07102},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2508.07102}
}
@article{DBLP:journals/corr/abs-2508-13214,
  author       = {Xuyang Guo and
                  Zekai Huang and
                  Zhao Song and
                  Jiahao Zhang},
  title        = {Too Easily Fooled? Prompt Injection Breaks {LLMs} on Frustratingly Simple
                  Multiple-Choice Questions},
  journal      = {CoRR},
  volume       = {abs/2508.13214},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2508.13214}
}
@article{DBLP:journals/corr/abs-2509-16801,
  author       = {Zhao Song and
                  David P. Woodruff and
                  Lichen Zhang},
  title        = {Sublinear Time Quantum Sensitivity Sampling},
  journal      = {CoRR},
  volume       = {abs/2509.16801},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2509.16801}
}
@article{DBLP:journals/corr/abs-2509-16915,
  author       = {Zhao Song and
                  Jianfei Xue and
                  Lichen Zhang},
  title        = {Differential Privacy for {Euclidean} {Jordan} Algebra with Applications
                  to Private Symmetric Cone Programming},
  journal      = {CoRR},
  volume       = {abs/2509.16915},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2509.16915}
}
@article{DBLP:journals/corr/abs-2509-21473,
  author       = {Hude Liu and
                  Jerry Yao{-}Chieh Hu and
                  Jennifer Yuntong Zhang and
                  Zhao Song and
                  Han Liu},
  title        = {Are Hallucinations Bad Estimations?},
  journal      = {CoRR},
  volume       = {abs/2509.21473},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2509.21473}
}
@article{DBLP:journals/corr/abs-2509-22623,
  author       = {Maojiang Su and
                  Mingcheng Lu and
                  Jerry Yao{-}Chieh Hu and
                  Shang Wu and
                  Zhao Song and
                  Alex Daniel Reneau and
                  Han Liu},
  title        = {A Theoretical Analysis of Discrete Flow Matching Generative Models},
  journal      = {CoRR},
  volume       = {abs/2509.22623},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2509.22623}
}
@article{DBLP:journals/corr/abs-2510-03678,
  author       = {Zhao Song and
                  Shenghao Xie and
                  Samson Zhou},
  title        = {Towards Sampling Data Structures for Tensor Products in Turnstile
                  Streams},
  journal      = {CoRR},
  volume       = {abs/2510.03678},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2510.03678}
}
@article{DBLP:journals/corr/abs-2510-04401,
  author       = {Xuyang Guo and
                  Zekai Huang and
                  Zhenmei Shi and
                  Zhao Song and
                  Jiahao Zhang},
  title        = {Your Vision-Language Model Can't Even Count to 20: Exposing the Failures
                  of {VLMs} in Compositional Counting},
  journal      = {CoRR},
  volume       = {abs/2510.04401},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2510.04401}
}
@article{DBLP:journals/corr/abs-2510-05494,
  author       = {Yang Cao and
                  Zhao Song and
                  Jiahao Zhang and
                  Jiale Zhao},
  title        = {Fundamental Limits of Crystalline Equivariant Graph Neural Networks:
                  {A} Circuit Complexity Perspective},
  journal      = {CoRR},
  volume       = {abs/2510.05494},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2510.05494}
}
@article{DBLP:journals/corr/abs-2510-22816,
  author       = {Honghao Lin and
                  Zhao Song and
                  David P. Woodruff and
                  Shenghao Xie and
                  Samson Zhou},
  title        = {{$L_p$} Sampling in Distributed Data Streams with Applications
                  to Adversarial Robustness},
  journal      = {CoRR},
  volume       = {abs/2510.22816},
  year         = {2025},
  eprinttype   = {arXiv},
  eprint       = {2510.22816}
}
@inproceedings{DBLP:conf/aaai/Chu0Y24,
  author    = {Chu, Timothy and Song, Zhao and Yang, Chiwun},
  title     = {How to Protect Copyright Data in Optimization of Large Language Models?},
  booktitle = {{AAAI}},
  pages     = {17871--17879},
  publisher = {{AAAI} Press},
  year      = {2024},
}
@inproceedings{DBLP:conf/aistats/0002Y024,
  author    = {Song, Zhao and Yin, Junze and Zhang, Lichen},
  title     = {Solving Attention Kernel Regression Problem via Pre-conditioner},
  booktitle = {{AISTATS}},
  series    = {Proceedings of Machine Learning Research},
  volume    = {238},
  pages     = {208--216},
  publisher = {{PMLR}},
  year      = {2024},
}
@inproceedings{DBLP:conf/aistats/0002Y0024,
  author       = {Song, Zhao and
                  Yin, Junze and
                  Zhang, Lichen and
                  Zhang, Ruizhe},
  title        = {Fast Dynamic Sampling for Determinantal Point Processes},
  booktitle    = {{AISTATS}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {238},
  pages        = {244--252},
  publisher    = {{PMLR}},
  year         = {2024}
}
@inproceedings{DBLP:conf/aistats/Qin0024,
  author       = {Qin, Lianke and
                  Song, Zhao and
                  Zhang, Ruizhe},
  title        = {A General Algorithm for Solving Rank-one Matrix Sensing},
  booktitle    = {{AISTATS}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {238},
  pages        = {757--765},
  publisher    = {{PMLR}},
  year         = {2024}
}
@inproceedings{DBLP:conf/bigdataconf/0002LM024,
  author       = {Deng, Yichuan and
                  Li, Zhihang and
                  Mahadevan, Sridhar and
                  Song, Zhao},
  title        = {Zero-th Order Algorithm for Softmax Attention Optimization},
  booktitle    = {{IEEE} Big Data},
  pages        = {24--33},
  publisher    = {{IEEE}},
  year         = {2024}
}
@inproceedings{DBLP:conf/bigdataconf/Ke00Z24,
  author       = {Ke, Yekun and
                  Li, Xiaoyu and
                  Song, Zhao and
                  Zhou, Tianyi},
  title        = {Faster Sampling Algorithms for Polytopes with Small Treewidth},
  booktitle    = {{IEEE} Big Data},
  pages        = {44--53},
  publisher    = {{IEEE}},
  year         = {2024}
}
@inproceedings{DBLP:conf/bigdataconf/0001L0Z24,
  author       = {Li, Xiaoyu and
                  Long, Jiangxuan and
                  Song, Zhao and
                  Zhou, Tianyi},
  title        = {Fast Second-order Method for Neural Networks under Small Treewidth
                  Setting},
  booktitle    = {{IEEE} Big Data},
  pages        = {1029--1038},
  publisher    = {{IEEE}},
  year         = {2024}
}
@inproceedings{DBLP:conf/bigdataconf/Qin0024,
  author       = {Qin, Lianke and
                  Song, Zhao and
                  Yang, Yuanyuan},
  title        = {Efficient {SGD} Neural Network Training via Sublinear Activated Neuron
                  Identification},
  booktitle    = {{IEEE} Big Data},
  pages        = {1413--1427},
  publisher    = {{IEEE}},
  year         = {2024}
}
@inproceedings{DBLP:conf/iclr/Alman024,
  author       = {Josh Alman and
                  Zhao Song},
  title        = {How to Capture Higher-order Correlations? Generalizing Matrix Softmax
                  Attention to {Kronecker} Computation},
  booktitle    = {{ICLR}},
  publisher    = {OpenReview.net},
  year         = {2024}
}
@inproceedings{DBLP:conf/iclr/GaoQ0W24,
  author       = {Gao, Yeqi and
                  Qin, Lianke and
                  Song, Zhao and
                  Wang, Yitan},
  title        = {A Sublinear Adversarial Training Algorithm},
  booktitle    = {{ICLR}},
  publisher    = {OpenReview.net},
  year         = {2024}
}
@inproceedings{DBLP:conf/iclr/Gu0Y024,
  author       = {Gu, Yuzhou and
                  Song, Zhao and
                  Yin, Junze and
                  Zhang, Lichen},
  title        = {Low Rank Matrix Completion via Robust Alternating Minimization in
                  Nearly Linear Time},
  booktitle    = {{ICLR}},
  publisher    = {OpenReview.net},
  year         = {2024}
}
@inproceedings{DBLP:conf/icml/Brand0024,
  author       = {van den Brand, Jan and
                  Song, Zhao and
                  Zhou, Tianyi},
  title        = {Algorithm and Hardness for Dynamic Attention Maintenance in Large
                  Language Models},
  booktitle    = {{ICML}},
  publisher    = {OpenReview.net},
  year         = {2024}
}
@inproceedings{DBLP:conf/icml/HuL0L24,
  author       = {Jerry Yao{-}Chieh Hu and
                  Thomas Lin and
                  Zhao Song and
                  Han Liu},
  title        = {On Computational Limits of Modern {Hopfield} Models: {A} Fine-Grained
                  Complexity Analysis},
  booktitle    = {{ICML}},
  publisher    = {OpenReview.net},
  year         = {2024}
}
@inproceedings{DBLP:conf/innovations/00020024,
  author       = {Song, Zhao and
                  Zhang, Lichen and
                  Zhang, Ruizhe},
  title        = {Training Multi-Layer Over-Parametrized Neural Network in Subquadratic
                  Time},
  booktitle    = {{ITCS}},
  series       = {LIPIcs},
  volume       = {287},
  pages        = {93:1--93:15},
  publisher    = {Schloss Dagstuhl - Leibniz-Zentrum f{\"{u}}r Informatik},
  year         = {2024}
}
@inproceedings{DBLP:conf/nips/0002VWZ24,
  author       = {Song, Zhao and
                  Vakilian, Ali and
                  Woodruff, David P. and
                  Zhou, Samson},
  title        = {On Socially Fair Low-Rank Approximation and Column Subset Selection},
  booktitle    = {NeurIPS},
  year         = {2024}
}
@inproceedings{DBLP:conf/nips/Alman024,
  author       = {Alman, Josh and
                  Song, Zhao},
  title        = {The Fine-Grained Complexity of Gradient Computation for Training Large
                  Language Models},
  booktitle    = {NeurIPS},
  year         = {2024}
}
@inproceedings{DBLP:conf/nips/ChuAMNS024,
  author       = {Chu, Timothy and
                  Alman, Josh and
                  Miller, Gary L. and
                  Narayanan, Shyam and
                  Sellke, Mark and
                  Song, Zhao},
  title        = {Metric Transforms and Low Rank Representations of Kernels for Fast
                  Attention},
  booktitle    = {NeurIPS},
  year         = {2024}
}
@inproceedings{DBLP:conf/nips/GuKM0024,
  author       = {Yuzhou Gu and
                  Nikki Lijing Kuang and
                  Yian Ma and
                  Zhao Song and
                  Lichen Zhang},
  title        = {Log-concave Sampling from a Convex Body with a Barrier: a Robust and
                  Unified {Dikin} Walk},
  booktitle    = {NeurIPS},
  year         = {2024}
}
@inproceedings{DBLP:conf/nips/HuWLP0L24,
  author       = {Jerry Yao{-}Chieh Hu and
                  Weimin Wu and
                  Zhuoru Li and
                  Sophia Pi and
                  Zhao Song and
                  Han Liu},
  title        = {On Statistical Rates and Provably Efficient Criteria of Latent Diffusion
                  Transformers ({DiTs})},
  booktitle    = {NeurIPS},
  year         = {2024}
}
@inproceedings{DBLP:conf/nips/Li0X0024,
  author       = {Li, Shuai and
                  Song, Zhao and
                  Xia, Yu and
                  Yu, Tong and
                  Zhou, Tianyi},
  title        = {The Closeness of In-Context Learning and Weight Shifting for Softmax
                  Regression},
  booktitle    = {NeurIPS},
  year         = {2024}
}
@inproceedings{DBLP:conf/soda/JiangLSZ24,
  author       = {Haotian Jiang and
                  Yin Tat Lee and
                  Zhao Song and
                  Lichen Zhang},
  title        = {Convex Minimization with Integer Minima in {$\widetilde{O}(n^4)$}
                  Time},
  booktitle    = {{SODA}},
  pages        = {3659--3684},
  publisher    = {{SIAM}},
  year         = {2024}
}
@inproceedings{DBLP:conf/uai/DengZM0L24,
  author       = {Wei Deng and
                  Qian Zhang and
                  Yian Ma and
                  Zhao Song and
                  Guang Lin},
  title        = {On Convergence of Federated Averaging {Langevin} Dynamics},
  booktitle    = {{UAI}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {244},
  pages        = {1022--1054},
  publisher    = {{PMLR}},
  year         = {2024}
}
@article{DBLP:journals/corr/abs-2402-01515,
  author       = {Yichuan Deng and
                  Zhao Song and
                  Chiwun Yang},
  title        = {Enhancing Stochastic Gradient Descent: {A} Unified Framework and Novel
                  Acceleration Methods for Faster Convergence},
  journal      = {CoRR},
  volume       = {abs/2402.01515},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2402.01515}
}
@article{DBLP:journals/corr/abs-2402-04497,
  author       = {Josh Alman and
                  Zhao Song},
  title        = {The Fine-Grained Complexity of Gradient Computation for Training Large
                  Language Models},
  journal      = {CoRR},
  volume       = {abs/2402.04497},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2402.04497}
}
@article{DBLP:journals/corr/abs-2402-04520,
  author       = {Jerry Yao{-}Chieh Hu and
                  Thomas Lin and
                  Zhao Song and
                  Han Liu},
  title        = {On Computational Limits of Modern {Hopfield} Models: {A} Fine-Grained
                  Complexity Analysis},
  journal      = {CoRR},
  volume       = {abs/2402.04520},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2402.04520}
}
@article{DBLP:journals/corr/abs-2402-07027,
  author       = {Yeqi Gao and
                  Zhao Song and
                  Ruizhe Zhang},
  title        = {Quantum Speedup for Spectral Approximation of {Kronecker} Products},
  journal      = {CoRR},
  volume       = {abs/2402.07027},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2402.07027}
}
@article{DBLP:journals/corr/abs-2402-09469,
  author       = {Jiuxiang Gu and
                  Chenyang Li and
                  Yingyu Liang and
                  Zhenmei Shi and
                  Zhao Song and
                  Tianyi Zhou},
  title        = {{Fourier} Circuits in Neural Networks: Unlocking the Potential of Large
                  Language Models in Mathematical Reasoning and Modular Arithmetic},
  journal      = {CoRR},
  volume       = {abs/2402.09469},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2402.09469}
}
@article{DBLP:journals/corr/abs-2404-02690,
  author       = {Yichuan Deng and
                  Zhao Song and
                  Chiwun Yang},
  title        = {Attention is Naturally Sparse with {Gaussian} Distributed Input},
  journal      = {CoRR},
  volume       = {abs/2404.02690},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2404.02690}
}
@article{DBLP:journals/corr/abs-2404-13785,
  author       = {Zhihang Li and
                  Zhao Song and
                  Weixin Wang and
                  Junze Yin and
                  Zheng Yu},
  title        = {How to Inverting the Leverage Score Distribution?},
  journal      = {CoRR},
  volume       = {abs/2404.13785},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2404.13785}
}
@article{DBLP:journals/corr/abs-2405-03251,
  author       = {Jiuxiang Gu and
                  Chenyang Li and
                  Yingyu Liang and
                  Zhenmei Shi and
                  Zhao Song},
  title        = {Exploring the Frontiers of Softmax: Provable Optimization, Applications
                  in Diffusion Model, and Beyond},
  journal      = {CoRR},
  volume       = {abs/2405.03251},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2405.03251}
}
@article{DBLP:journals/corr/abs-2405-05219,
  author       = {Jiuxiang Gu and
                  Yingyu Liang and
                  Heshan Liu and
                  Zhenmei Shi and
                  Zhao Song and
                  Junze Yin},
  title        = {{Conv-Basis}: {A} New Paradigm for Efficient Attention Inference and
                  Gradient Computation in Transformers},
  journal      = {CoRR},
  volume       = {abs/2405.05219},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2405.05219}
}
@article{DBLP:journals/corr/abs-2405-06003,
  author       = {Yeqi Gao and
                  Yuzhou Gu and
                  Zhao Song},
  title        = {Binary Hypothesis Testing for Softmax Models and Leverage Score Models},
  journal      = {CoRR},
  volume       = {abs/2405.06003},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2405.06003}
}
@article{DBLP:journals/corr/abs-2405-16411,
  author       = {Jiuxiang Gu and
                  Yingyu Liang and
                  Zhenmei Shi and
                  Zhao Song and
                  Yufa Zhou},
  title        = {Tensor Attention Training: Provably Efficient Learning of Higher-order
                  Transformers},
  journal      = {CoRR},
  volume       = {abs/2405.16411},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2405.16411}
}
@article{DBLP:journals/corr/abs-2405-16418,
  author       = {Jiuxiang Gu and
                  Yingyu Liang and
                  Zhenmei Shi and
                  Zhao Song and
                  Yufa Zhou},
  title        = {Unraveling the Smoothness Properties of Diffusion Models: {A} {Gaussian}
                  Mixture Perspective},
  journal      = {CoRR},
  volume       = {abs/2405.16418},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2405.16418}
}
@article{DBLP:journals/corr/abs-2406-03136,
  author       = {Jerry Yao{-}Chieh Hu and
                  Maojiang Su and
                  En{-}Jui Kuo and
                  Zhao Song and
                  Han Liu},
  title        = {Computational Limits of Low-Rank Adaptation ({LoRA}) for Transformer-Based
                  Models},
  journal      = {CoRR},
  volume       = {abs/2406.03136},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2406.03136}
}
@article{DBLP:journals/corr/abs-2406-14036,
  author       = {Jiuxiang Gu and
                  Yingyu Liang and
                  Zhenmei Shi and
                  Zhao Song and
                  Chiwun Yang},
  title        = {Toward Infinite-Long Prefix in Transformer},
  journal      = {CoRR},
  volume       = {abs/2406.14036},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2406.14036}
}
@article{DBLP:journals/corr/abs-2407-01079,
  author       = {Jerry Yao{-}Chieh Hu and
                  Weimin Wu and
                  Zhuoru Li and
                  Zhao Song and
                  Han Liu},
  title        = {On Statistical Rates and Provably Efficient Criteria of Latent Diffusion
                  Transformers ({DiTs})},
  journal      = {CoRR},
  volume       = {abs/2407.01079},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2407.01079}
}
@article{DBLP:journals/corr/abs-2407-13621,
  author       = {Jiuxiang Gu and
                  Yingyu Liang and
                  Zhizhou Sha and
                  Zhenmei Shi and
                  Zhao Song},
  title        = {Differential Privacy Mechanisms in Neural Tangent Kernel Regression},
  journal      = {CoRR},
  volume       = {abs/2407.13621},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2407.13621}
}
@article{DBLP:journals/corr/abs-2407-14717,
  author       = {Jiuxiang Gu and
                  Yingyu Liang and
                  Zhenmei Shi and
                  Zhao Song and
                  Yufa Zhou},
  title        = {Differential Privacy of Cross-Attention with Provable Guarantee},
  journal      = {CoRR},
  volume       = {abs/2407.14717},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2407.14717}
}
@article{DBLP:journals/corr/abs-2408-06395,
  author       = {Jiuxiang Gu and
                  Xiaoyu Li and
                  Yingyu Liang and
                  Zhenmei Shi and
                  Zhao Song and
                  Junwei Yu},
  title        = {Fast {John} Ellipsoid Computation with Differential Privacy Optimization},
  journal      = {CoRR},
  volume       = {abs/2408.06395},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2408.06395}
}
@article{DBLP:journals/corr/abs-2408-11267,
  author       = {Chenyang Li and
                  Zhao Song and
                  Zhaoxing Xu and
                  Junze Yin},
  title        = {Inverting the Leverage Score Gradient: An Efficient Approximate {Newton}
                  Method},
  journal      = {CoRR},
  volume       = {abs/2408.11267},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2408.11267}
}
@article{DBLP:journals/corr/abs-2408-12151,
  author       = {Xiaoyu Li and
                  Yingyu Liang and
                  Zhenmei Shi and
                  Zhao Song},
  title        = {A Tighter Complexity Analysis of {SparseGPT}},
  journal      = {CoRR},
  volume       = {abs/2408.12151},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2408.12151}
}
@article{DBLP:journals/corr/abs-2408-13233,
  author       = {Yingyu Liang and
                  Zhizhou Sha and
                  Zhenmei Shi and
                  Zhao Song and
                  Yufa Zhou},
  title        = {Multi-Layer Transformers Gradient Can be Approximated in Almost Linear
                  Time},
  journal      = {CoRR},
  volume       = {abs/2408.13233},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2408.13233}
}
@article{DBLP:journals/corr/abs-2408-14018,
  author       = {Xiaoyu Li and
                  Zhao Song and
                  Junwei Yu},
  title        = {Quantum Speedups for Approximating the {John} Ellipsoid},
  journal      = {CoRR},
  volume       = {abs/2408.14018},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2408.14018}
}
@article{DBLP:journals/corr/abs-2409-01688,
  author       = {Erzhi Liu and
                  Jerry Yao{-}Chieh Hu and
                  Alex Daniel Reneau and
                  Zhao Song and
                  Han Liu},
  title        = {Differentially Private Kernel Density Estimation},
  journal      = {CoRR},
  volume       = {abs/2409.01688},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2409.01688}
}
@article{DBLP:journals/corr/abs-2410-05700,
  author       = {Yuzhou Gu and
                  Nikki Lijing Kuang and
                  Yi{-}An Ma and
                  Zhao Song and
                  Lichen Zhang},
  title        = {Log-concave Sampling over a Convex Body with a Barrier: a Robust and
                  Unified {Dikin} Walk},
  journal      = {CoRR},
  volume       = {abs/2410.05700},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2410.05700}
}
@article{DBLP:journals/corr/abs-2410-09375,
  author       = {Yingyu Liang and
                  Zhizhou Sha and
                  Zhenmei Shi and
                  Zhao Song and
                  Yufa Zhou},
  title        = {Looped {ReLU} {MLPs} May Be All You Need as Practical Programmable Computers},
  journal      = {CoRR},
  volume       = {abs/2410.09375},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2410.09375}
}
@article{DBLP:journals/corr/abs-2410-09397,
  author       = {Xiaoyu Li and
                  Yingyu Liang and
                  Zhenmei Shi and
                  Zhao Song and
                  Yufa Zhou},
  title        = {Fine-grained Attention {I/O} Complexity: Comprehensive Analysis for
                  Backward Passes},
  journal      = {CoRR},
  volume       = {abs/2410.09397},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2410.09397}
}
@article{DBLP:journals/corr/abs-2410-10165,
  author       = {Bo Chen and
                  Yingyu Liang and
                  Zhizhou Sha and
                  Zhenmei Shi and
                  Zhao Song},
  title        = {{HSR}-Enhanced Sparse Attention Acceleration},
  journal      = {CoRR},
  volume       = {abs/2410.10165},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2410.10165}
}
@article{DBLP:journals/corr/abs-2410-11261,
  author       = {Yingyu Liang and
                  Jiangxuan Long and
                  Zhenmei Shi and
                  Zhao Song and
                  Yufa Zhou},
  title        = {Beyond Linear Approximations: {A} Novel Pruning Approach for Attention
                  Matrix},
  journal      = {CoRR},
  volume       = {abs/2410.11261},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2410.11261}
}
@article{DBLP:journals/corr/abs-2410-11268,
  author       = {Bo Chen and
                  Xiaoyu Li and
                  Yingyu Liang and
                  Zhenmei Shi and
                  Zhao Song},
  title        = {Bypassing the Exponential Dependency: Looped Transformers Efficiently
                  Learn In-context by Multi-step Gradient Descent},
  journal      = {CoRR},
  volume       = {abs/2410.11268},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2410.11268}
}
@article{DBLP:journals/corr/abs-2410-11279,
  author       = {Yekun Ke and
                  Xiaoyu Li and
                  Yingyu Liang and
                  Zhenmei Shi and
                  Zhao Song},
  title        = {Advancing the Understanding of Fixed Point Iterations in Deep Neural
                  Networks: {A} Detailed Analytical Study},
  journal      = {CoRR},
  volume       = {abs/2410.11279},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2410.11279}
}
@article{DBLP:journals/corr/abs-2411-01663,
  author       = {Majid Daliri and
                  Zhao Song and
                  Chiwun Yang},
  title        = {Unlocking the Theory Behind Scaling 1-Bit Neural Networks},
  journal      = {CoRR},
  volume       = {abs/2411.01663},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2411.01663}
}
@article{DBLP:journals/corr/abs-2411-05750,
  author       = {Jerry Yao{-}Chieh Hu and
                  Erzhi Liu and
                  Han Liu and
                  Zhao Song and
                  Lichen Zhang},
  title        = {On Differentially Private String Distances},
  journal      = {CoRR},
  volume       = {abs/2411.05750},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2411.05750}
}
@article{DBLP:journals/corr/abs-2411-07602,
  author       = {Bo Chen and
                  Xiaoyu Li and
                  Yingyu Liang and
                  Jiangxuan Long and
                  Zhenmei Shi and
                  Zhao Song},
  title        = {Circuit Complexity Bounds for {RoPE}-based Transformer Architecture},
  journal      = {CoRR},
  volume       = {abs/2411.07602},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2411.07602}
}
@article{DBLP:journals/corr/abs-2411-16525,
  author       = {Jerry Yao{-}Chieh Hu and
                  Wei{-}Po Wang and
                  Ammar Gilani and
                  Chenyang Li and
                  Zhao Song and
                  Han Liu},
  title        = {Fundamental Limits of Prompt Tuning Transformers: Universality, Capacity
                  and Efficiency},
  journal      = {CoRR},
  volume       = {abs/2411.16525},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2411.16525}
}
@article{DBLP:journals/corr/abs-2411-16549,
  author       = {Weimin Wu and
                  Maojiang Su and
                  Jerry Yao{-}Chieh Hu and
                  Zhao Song and
                  Han Liu},
  title        = {Transformers are Deep Optimizers: Provable In-Context Learning for
                  Deep Model Training},
  journal      = {CoRR},
  volume       = {abs/2411.16549},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2411.16549}
}
@article{DBLP:journals/corr/abs-2412-05562,
  author       = {Xiaoyu Li and
                  Yuanpeng Li and
                  Yingyu Liang and
                  Zhenmei Shi and
                  Zhao Song},
  title        = {On the Expressive Power of Modern {Hopfield} Networks},
  journal      = {CoRR},
  volume       = {abs/2412.05562},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2412.05562}
}
@article{DBLP:journals/corr/abs-2412-06061,
  author       = {Yekun Ke and
                  Yingyu Liang and
                  Zhenmei Shi and
                  Zhao Song and
                  Chiwun Yang},
  title        = {Curse of Attention: {A} Kernel-Based Perspective for Why Transformers
                  Fail to Generalize on Time Series Forecasting and Beyond},
  journal      = {CoRR},
  volume       = {abs/2412.06061},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2412.06061}
}
@article{DBLP:journals/corr/abs-2412-06063,
  author       = {Zhao Song and
                  Ali Vakilian and
                  David P. Woodruff and
                  Samson Zhou},
  title        = {On Socially Fair Low-Rank Approximation and Column Subset Selection},
  journal      = {CoRR},
  volume       = {abs/2412.06063},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2412.06063}
}
@article{DBLP:journals/corr/abs-2412-06148,
  author       = {Yifang Chen and
                  Xiaoyu Li and
                  Yingyu Liang and
                  Zhenmei Shi and
                  Zhao Song},
  title        = {The Computational Limits of State-Space Models and {Mamba} via the Lens
                  of Circuit Complexity},
  journal      = {CoRR},
  volume       = {abs/2412.06148},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2412.06148}
}
@article{DBLP:journals/corr/abs-2412-12441,
  author       = {Xuan Shen and
                  Zhao Song and
                  Yufa Zhou and
                  Bo Chen and
                  Jing Liu and
                  Ruiyi Zhang and
                  Ryan A. Rossi and
                  Hao Tan and
                  Tong Yu and
                  Xiang Chen and
                  Yufan Zhou and
                  Tong Sun and
                  Pu Zhao and
                  Yanzhi Wang and
                  Jiuxiang Gu},
  title        = {Numerical Pruning for Efficient Autoregressive Models},
  journal      = {CoRR},
  volume       = {abs/2412.12441},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2412.12441}
}
@article{DBLP:journals/corr/abs-2412-12444,
  author       = {Xuan Shen and
                  Zhao Song and
                  Yufa Zhou and
                  Bo Chen and
                  Yanyu Li and
                  Yifan Gong and
                  Kai Zhang and
                  Hao Tan and
                  Jason Kuen and
                  Henghui Ding and
                  Zhihao Shu and
                  Wei Niu and
                  Pu Zhao and
                  Yanzhi Wang and
                  Jiuxiang Gu},
  title        = {{LazyDiT}: Lazy Learning for the Acceleration of Diffusion Transformers},
  journal      = {CoRR},
  volume       = {abs/2412.12444},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2412.12444}
}
@article{DBLP:journals/corr/abs-2412-17107,
  author       = {Yang Cao and
                  Xiaoyu Li and
                  Zhao Song},
  title        = {Grams: Gradient Descent with Adaptive Momentum Scaling},
  journal      = {CoRR},
  volume       = {abs/2412.17107},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2412.17107}
}
@article{DBLP:journals/corr/abs-2412-17316,
  author       = {Yifang Chen and
                  Jiayan Huo and
                  Xiaoyu Li and
                  Yingyu Liang and
                  Zhenmei Shi and
                  Zhao Song},
  title        = {Fast Gradient Computation for {RoPE} Attention in Almost Linear Time},
  journal      = {CoRR},
  volume       = {abs/2412.17316},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2412.17316}
}
@article{DBLP:journals/corr/abs-2412-18040,
  author       = {Xiaoyu Li and
                  Yingyu Liang and
                  Zhenmei Shi and
                  Zhao Song and
                  Mingda Wan},
  title        = {Theoretical Constraints on the Expressive Power of {RoPE}-based Tensor
                  Attention Transformers},
  journal      = {CoRR},
  volume       = {abs/2412.18040},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2412.18040}
}
@inproceedings{DBLP:conf/aaai/Wang0TM23,
  author       = {Wang, Kai and
                  Song, Zhao and
                  Theocharous, Georgios and
                  Mahadevan, Sridhar},
  title        = {Smoothed Online Combinatorial Optimization Using Imperfect Predictions},
  booktitle    = {{AAAI}},
  pages        = {12130--12137},
  publisher    = {{AAAI} Press},
  year         = {2023}
}
@inproceedings{DBLP:conf/aistats/Qin00Z23,
  author       = {Qin, Lianke and
                  Song, Zhao and
                  Zhang, Lichen and
                  Zhuo, Danyang},
  title        = {An Online and Unified Algorithm for Projection Matrix Vector Multiplication
                  with Application to Empirical Risk Minimization},
  booktitle    = {{AISTATS}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {206},
  pages        = {101--156},
  publisher    = {{PMLR}},
  year         = {2023}
}
@inproceedings{DBLP:conf/aistats/Xu0S23,
  author       = {Zhaozhuo Xu and
                  Zhao Song and
                  Anshumali Shrivastava},
  title        = {A Tale of Two Efficient Value Iteration Algorithms for Solving Linear
                  {MDPs} with Large Action Space},
  booktitle    = {{AISTATS}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {206},
  pages        = {788--836},
  publisher    = {{PMLR}},
  year         = {2023}
}
@inproceedings{DBLP:conf/bigdataconf/DengGS23,
  author       = {Deng, Yichuan and
                  Gao, Yeqi and
                  Song, Zhao},
  title        = {Solving Tensor Low Cycle Rank Approximation},
  booktitle    = {{IEEE} Big Data},
  pages        = {6--16},
  publisher    = {{IEEE}},
  year         = {2023}
}
@inproceedings{DBLP:conf/bigdataconf/QinRS23,
  author       = {Lianke Qin and
                  Aravind Reddy and
                  Zhao Song},
  title        = {Online Adaptive {Mahalanobis} Distance Estimation},
  booktitle    = {{IEEE} Big Data},
  pages        = {56--65},
  publisher    = {{IEEE}},
  year         = {2023}
}
@inproceedings{DBLP:conf/bigdataconf/QinMSYZ23,
  author       = {Qin, Lianke and
                  Mitra, Saayan and
                  Song, Zhao and
                  Yang, Yuanyuan and
                  Zhou, Tianyi},
  title        = {Fast Heavy Inner Product Identification Between Weights and Inputs
                  in Neural Network Training},
  booktitle    = {{IEEE} Big Data},
  pages        = {128--133},
  publisher    = {{IEEE}},
  year         = {2023}
}
@inproceedings{DBLP:conf/focs/00020W023,
  author       = {Zhao Song and
                  Baocheng Sun and
                  Omri Weinstein and
                  Ruizhe Zhang},
  title        = {Quartic Samples Suffice for {Fourier} Interpolation},
  booktitle    = {{FOCS}},
  pages        = {1414--1425},
  publisher    = {{IEEE}},
  year         = {2023}
}
@inproceedings{DBLP:conf/icalp/Liu0Z0023,
  author       = {Liu, S. Cliff and
                  Song, Zhao and
                  Zhang, Hengjie and
                  Zhang, Lichen and
                  Zhou, Tianyi},
  title        = {Space-Efficient Interior Point Method, with Applications to Linear
                  Programming and Maximum Weight Bipartite Matching},
  booktitle    = {{ICALP}},
  series       = {LIPIcs},
  volume       = {261},
  pages        = {88:1--88:14},
  publisher    = {Schloss Dagstuhl - Leibniz-Zentrum f{\"{u}}r Informatik},
  year         = {2023}
}
@inproceedings{DBLP:conf/icml/Li0Y23,
  author       = {Li, Xiaoxiao and
                  Song, Zhao and
                  Yang, Jiaming},
  title        = {Federated Adversarial Learning: {A} Framework with Convergence Analysis},
  booktitle    = {{ICML}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {202},
  pages        = {19932--19959},
  publisher    = {{PMLR}},
  year         = {2023}
}
@inproceedings{DBLP:conf/icml/LiuWDZY0S0TRC23,
  author       = {Zichang Liu and
                  Jue Wang and
                  Tri Dao and
                  Tianyi Zhou and
                  Binhang Yuan and
                  Zhao Song and
                  Anshumali Shrivastava and
                  Ce Zhang and
                  Yuandong Tian and
                  Christopher R{\'{e}} and
                  Beidi Chen},
  title        = {{Deja Vu}: Contextual Sparsity for Efficient {LLMs} at Inference Time},
  booktitle    = {{ICML}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {202},
  pages        = {22137--22176},
  publisher    = {{PMLR}},
  year         = {2023}
}
@inproceedings{DBLP:conf/icml/0002WY023,
  author       = {Song, Zhao and
                  Wang, Yitan and
                  Yu, Zheng and
                  Zhang, Lichen},
  title        = {Sketching for First Order Method: Efficient Algorithm for Low-Bandwidth
                  Channel and Vulnerability},
  booktitle    = {{ICML}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {202},
  pages        = {32365--32417},
  publisher    = {{PMLR}},
  year         = {2023}
}
@inproceedings{DBLP:conf/icml/000200023,
  author       = {Zhao Song and
                  Xin Yang and
                  Yuanyuan Yang and
                  Lichen Zhang},
  title        = {Sketching Meets Differential Privacy: Fast Algorithm for Dynamic {Kronecker}
                  Projection Maintenance},
  booktitle    = {{ICML}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {202},
  pages        = {32418--32462},
  publisher    = {{PMLR}},
  year         = {2023}
}
@inproceedings{DBLP:conf/icml/0002YY023,
  author       = {Zhao Song and
                  Mingquan Ye and
                  Junze Yin and
                  Lichen Zhang},
  title        = {A Nearly-Optimal Bound for Fast Regression with {$\ell_\infty$}
                  Guarantee},
  booktitle    = {{ICML}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {202},
  pages        = {32463--32482},
  publisher    = {{PMLR}},
  year         = {2023}
}
@inproceedings{DBLP:conf/nips/Alman023,
  author       = {Alman, Josh and
                  Song, Zhao},
  title        = {Fast Attention Requires Bounded Entries},
  booktitle    = {NeurIPS},
  year         = {2023}
}
@inproceedings{DBLP:conf/nips/AlmanL00Z23,
  author       = {Josh Alman and
                  Jiehao Liang and
                  Zhao Song and
                  Ruizhe Zhang and
                  Danyang Zhuo},
  title        = {Bypass Exponential Time Preprocessing: Fast Neural Network Training
                  via Weight-Data Correlation Preprocessing},
  booktitle    = {NeurIPS},
  year         = {2023}
}
@inproceedings{DBLP:conf/nips/ChanpuriyaRRML023,
  author       = {Sudhanshu Chanpuriya and
                  Ryan A. Rossi and
                  Anup B. Rao and
                  Tung Mai and
                  Nedim Lipka and
                  Zhao Song and
                  Cameron Musco},
  title        = {Exact Representation of Sparse Networks with Symmetric Nonnegative
                  Embeddings},
  booktitle    = {NeurIPS},
  year         = {2023}
}
@inproceedings{DBLP:conf/nips/WuYW0ZZL0H23,
  author       = {Junda Wu and
                  Tong Yu and
                  Rui Wang and
                  Zhao Song and
                  Ruiyi Zhang and
                  Handong Zhao and
                  Chaochao Lu and
                  Shuai Li and
                  Ricardo Henao},
  title        = {{InfoPrompt}: Information-Theoretic Soft Prompt Tuning for Natural Language
                  Understanding},
  booktitle    = {NeurIPS},
  year         = {2023}
}
@inproceedings{DBLP:conf/nips/Zhang00CZC0TRBW23,
  author       = {Zhenyu Zhang and
                  Ying Sheng and
                  Tianyi Zhou and
                  Tianlong Chen and
                  Lianmin Zheng and
                  Ruisi Cai and
                  Zhao Song and
                  Yuandong Tian and
                  Christopher R{\'{e}} and
                  Clark W. Barrett and
                  Zhangyang Wang and
                  Beidi Chen},
  title        = {{H$_2$O}: Heavy-Hitter Oracle for Efficient Generative Inference of Large
                  Language Models},
  booktitle    = {NeurIPS},
  year         = {2023}
}
@inproceedings{DBLP:conf/soda/0001KPS0Y23,
  author       = {Lijie Chen and
                  Gillat Kol and
                  Dmitry Paramonov and
                  Raghuvansh R. Saxena and
                  Zhao Song and
                  Huacheng Yu},
  title        = {Towards Multi-Pass Streaming Lower Bounds for Optimal Approximation
                  of Max-Cut},
  booktitle    = {{SODA}},
  pages        = {878--924},
  publisher    = {{SIAM}},
  year         = {2023}
}
@inproceedings{DBLP:conf/soda/JinL023,
  author       = {Yaonan Jin and
                  Daogao Liu and
                  Zhao Song},
  title        = {Super-resolution and Robust Sparse Continuous {Fourier} Transform in
                  Any Constant Dimension: Nearly Linear Time and Sample Complexity},
  booktitle    = {{SODA}},
  pages        = {4667--4767},
  publisher    = {{SIAM}},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2301-06741,
  author       = {Zhao Song and
                  Tianyi Zhou},
  title        = {Faster {Sinkhorn's} Algorithm with Small Treewidth},
  journal      = {CoRR},
  volume       = {abs/2301.06741},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2302-00248,
  author       = {Zhao Song and
                  Mingquan Ye and
                  Junze Yin and
                  Lichen Zhang},
  title        = {A Nearly-Optimal Bound for Fast Regression with {$\ell_\infty$}
                  Guarantee},
  journal      = {CoRR},
  volume       = {abs/2302.00248},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2302-11068,
  author       = {Yuzhou Gu and
                  Zhao Song and
                  Junze Yin and
                  Lichen Zhang},
  title        = {Low Rank Matrix Completion via Robust Alternating Minimization in
                  Nearly Linear Time},
  journal      = {CoRR},
  volume       = {abs/2302.11068},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2302-13214,
  author       = {Josh Alman and
                  Zhao Song},
  title        = {Fast Attention Requires Bounded Entries},
  journal      = {CoRR},
  volume       = {abs/2302.13214},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2303-04555,
  author       = {Yichuan Deng and
                  Zhao Song and
                  Zifan Wang and
                  Han Zhang},
  title        = {Streaming Kernel {PCA} Algorithm With Small Space},
  journal      = {CoRR},
  volume       = {abs/2303.04555},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2303-06210,
  author       = {Anshumali Shrivastava and
                  Zhao Song and
                  Zhaozhuo Xu},
  title        = {A Theoretical Analysis Of Nearest Neighbor Search On Approximate Near
                  Neighbor Graph},
  journal      = {CoRR},
  volume       = {abs/2303.06210},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2303-06895,
  author       = {Yichuan Deng and
                  Zhihang Li and
                  Zhao Song},
  title        = {An Improved Sample Complexity for Rank-1 Matrix Sensing},
  journal      = {CoRR},
  volume       = {abs/2303.06895},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2303-12298,
  author       = {Lianke Qin and
                  Zhao Song and
                  Ruizhe Zhang},
  title        = {A General Algorithm for Solving Rank-one Matrix Sensing},
  journal      = {CoRR},
  volume       = {abs/2303.12298},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2303-15725,
  author       = {Zhihang Li and
                  Zhao Song and
                  Tianyi Zhou},
  title        = {Solving Regularized Exp, Cosh and Sinh Regression Problems},
  journal      = {CoRR},
  volume       = {abs/2303.15725},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2303-16504,
  author       = {Yeqi Gao and
                  Sridhar Mahadevan and
                  Zhao Song},
  title        = {An Over-parameterized Exponential Regression},
  journal      = {CoRR},
  volume       = {abs/2303.16504},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2304-02207,
  author       = {Jan van den Brand and
                  Zhao Song and
                  Tianyi Zhou},
  title        = {Algorithm and Hardness for Dynamic Attention Maintenance in Large
                  Language Models},
  journal      = {CoRR},
  volume       = {abs/2304.02207},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2304-03426,
  author       = {Haotian Jiang and
                  Yin Tat Lee and
                  Zhao Song and
                  Lichen Zhang},
  title        = {Convex Minimization with Integer Minima in {$\widetilde{O}(n^4)$}
                  Time},
  journal      = {CoRR},
  volume       = {abs/2304.03426},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2304-04397,
  author       = {Yichuan Deng and
                  Sridhar Mahadevan and
                  Zhao Song},
  title        = {Randomized and Deterministic Attention Sparsification Algorithms for
                  Over-parameterized Feature Dimension},
  journal      = {CoRR},
  volume       = {abs/2304.04397},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2304-06594,
  author       = {Yichuan Deng and
                  Yeqi Gao and
                  Zhao Song},
  title        = {Solving Tensor Low Cycle Rank Approximation},
  journal      = {CoRR},
  volume       = {abs/2304.06594},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2304-10411,
  author       = {Yichuan Deng and
                  Zhihang Li and
                  Zhao Song},
  title        = {Attention Scheme Inspired Softmax Regression},
  journal      = {CoRR},
  volume       = {abs/2304.10411},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2304-13276,
  author       = {Shuai Li and
                  Zhao Song and
                  Yu Xia and
                  Tong Yu and
                  Tianyi Zhou},
  title        = {The Closeness of In-Context Learning and Weight Shifting for Softmax
                  Regression},
  journal      = {CoRR},
  volume       = {abs/2304.13276},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2305-00660,
  author       = {Yeqi Gao and
                  Zhao Song and
                  Junze Yin},
  title        = {An Iterative Algorithm for Rescaled Hyperbolic Functions Regression},
  journal      = {CoRR},
  volume       = {abs/2305.00660},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2305-04701,
  author       = {Yeqi Gao and
                  Zhao Song and
                  Xin Yang},
  title        = {Differentially Private Attention Computation},
  journal      = {CoRR},
  volume       = {abs/2305.04701},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2305-08001,
  author       = {Zhao Song and
                  Mingquan Ye},
  title        = {Efficient Asynchronize Stochastic Gradient Algorithm with Structured
                  Data},
  journal      = {CoRR},
  volume       = {abs/2305.08001},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2305-08353,
  author       = {Zhao Song and
                  Weixin Wang and
                  Chenbo Yin},
  title        = {Fast and Efficient Matching Algorithm with Deadline Instances},
  journal      = {CoRR},
  volume       = {abs/2305.08353},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2305-08367,
  author       = {Lianke Qin and
                  Zhao Song and
                  Yitan Wang},
  title        = {Fast Submodular Function Maximization},
  journal      = {CoRR},
  volume       = {abs/2305.08367},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2305-17482,
  author       = {Song Bian and
                  Zhao Song and
                  Junze Yin},
  title        = {Federated Empirical Risk Minimization via Second-Order Method},
  journal      = {CoRR},
  volume       = {abs/2305.17482},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2306-00406,
  author       = {Yichuan Deng and
                  Zhao Song and
                  Junze Yin},
  title        = {Faster Robust Tensor Power Method for Arbitrary Order},
  journal      = {CoRR},
  volume       = {abs/2306.00406},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2306-02295,
  author       = {Ritwik Sinha and
                  Zhao Song and
                  Tianyi Zhou},
  title        = {A Mathematical Abstraction for Balancing the Trade-off Between Creativity
                  and Reality in Large Language Models},
  journal      = {CoRR},
  volume       = {abs/2306.02295},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2306-02381,
  author       = {Xiaoxiao Li and
                  Zhao Song and
                  Guangyi Zhang},
  title        = {Sparse Convolution for Approximate Sparse Instance},
  journal      = {CoRR},
  volume       = {abs/2306.02381},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2306-03356,
  author       = {Xiang Chen and
                  Zhao Song and
                  Baocheng Sun and
                  Junze Yin and
                  Danyang Zhuo},
  title        = {Query Complexity of Active Learning for Function Family With Nearly
                  Orthogonal Basis},
  journal      = {CoRR},
  volume       = {abs/2306.03356},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2306-04169,
  author       = {Zhao Song and
                  Mingquan Ye and
                  Junze Yin and
                  Lichen Zhang},
  title        = {Efficient Alternating Minimization with Applications to Weighted Low
                  Rank Approximation},
  journal      = {CoRR},
  volume       = {abs/2306.04169},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2306-04933,
  author       = {Junda Wu and
                  Tong Yu and
                  Rui Wang and
                  Zhao Song and
                  Ruiyi Zhang and
                  Handong Zhao and
                  Chaochao Lu and
                  Shuai Li and
                  Ricardo Henao},
  title        = {{InfoPrompt}: Information-Theoretic Soft Prompt Tuning for Natural Language
                  Understanding},
  journal      = {CoRR},
  volume       = {abs/2306.04933},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2306-07587,
  author       = {Yichuan Deng and
                  Zhao Song and
                  Lichen Zhang and
                  Ruizhe Zhang},
  title        = {Efficient Algorithm for Solving Hyperbolic Programs},
  journal      = {CoRR},
  volume       = {abs/2306.07587},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2306-14048,
  author       = {Zhenyu Zhang and
                  Ying Sheng and
                  Tianyi Zhou and
                  Tianlong Chen and
                  Lianmin Zheng and
                  Ruisi Cai and
                  Zhao Song and
                  Yuandong Tian and
                  Christopher R{\'{e}} and
                  Clark W. Barrett and
                  Zhangyang Wang and
                  Beidi Chen},
  title        = {{H$_2$O}: Heavy-Hitter Oracle for Efficient Generative
                  Inference of Large Language Models},
  journal      = {CoRR},
  volume       = {abs/2306.14048},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2307-02419,
  author       = {Yeqi Gao and
                  Zhao Song and
                  Shenghao Xie},
  title        = {In-Context Learning for Attention Scheme: from Single Softmax Regression
                  to Multiple Softmax Regression via a Tensor Trick},
  journal      = {CoRR},
  volume       = {abs/2307.02419},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2307-06565,
  author       = {Lianke Qin and
                  Zhao Song and
                  Yuanyuan Yang},
  title        = {Efficient {SGD} Neural Network Training via Sublinear Activated Neuron
                  Identification},
  journal      = {CoRR},
  volume       = {abs/2307.06565},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2307-07735,
  author       = {Yuzhou Gu and
                  Zhao Song and
                  Lichen Zhang},
  title        = {A Nearly-Linear Time Algorithm for Structured Support Vector Machines},
  journal      = {CoRR},
  volume       = {abs/2307.07735},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2307-08045,
  author       = {Yeqi Gao and
                  Zhao Song and
                  Xin Yang and
                  Ruizhe Zhang},
  title        = {Fast Quantum Algorithm for Attention Computation},
  journal      = {CoRR},
  volume       = {abs/2307.08045},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2307-08352,
  author       = {Yichuan Deng and
                  Zhihang Li and
                  Sridhar Mahadevan and
                  Zhao Song},
  title        = {Zero-th Order Algorithm for Softmax Attention Optimization},
  journal      = {CoRR},
  volume       = {abs/2307.08352},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2308-08358,
  author       = {Yichuan Deng and
                  Zhao Song and
                  Shenghao Xie},
  title        = {Convergence of Two-Layer Regression with Nonlinear Units},
  journal      = {CoRR},
  volume       = {abs/2308.08358},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2308-10502,
  author       = {Yeqi Gao and
                  Zhao Song and
                  Junze Yin},
  title        = {{GradientCoin}: {A} Peer-to-Peer Decentralized Large Language Models},
  journal      = {CoRR},
  volume       = {abs/2308.10502},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2308-10722,
  author       = {Yichuan Deng and
                  Michalis Mamakos and
                  Zhao Song},
  title        = {Clustered Linear Contextual Bandits with Knapsacks},
  journal      = {CoRR},
  volume       = {abs/2308.10722},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2308-12247,
  author       = {Timothy Chu and
                  Zhao Song and
                  Chiwun Yang},
  title        = {How to Protect Copyright Data in Optimization of Large Language Models?},
  journal      = {CoRR},
  volume       = {abs/2308.12247},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2308-14304,
  author       = {Zhao Song and
                  Junze Yin and
                  Lichen Zhang},
  title        = {Solving Attention Kernel Regression Problem via Pre-conditioner},
  journal      = {CoRR},
  volume       = {abs/2308.14304},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2309-01030,
  author       = {Lianke Qin and
                  Aravind Reddy and
                  Zhao Song},
  title        = {Online Adaptive {Mahalanobis} Distance Estimation},
  journal      = {CoRR},
  volume       = {abs/2309.01030},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2309-05135,
  author       = {Zhao Song and
                  Mingquan Ye and
                  Lichen Zhang},
  title        = {Streaming Semidefinite Programs: {$O(\sqrt{n})$} Passes, Small Space
                  and Fast Runtime},
  journal      = {CoRR},
  volume       = {abs/2309.05135},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2309-07418,
  author       = {Yeqi Gao and
                  Zhao Song and
                  Weixin Wang and
                  Junze Yin},
  title        = {A Fast Optimization View: Reformulating Single Layer Attention in
                  {LLM} Based on Tensor and {SVM} Trick, and Solving It in Matrix Multiplication
                  Time},
  journal      = {CoRR},
  volume       = {abs/2309.07418},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2309-07452,
  author       = {Lianke Qin and
                  Zhao Song and
                  Baocheng Sun},
  title        = {Is Solving Graph Neural Tangent Kernel Equivalent to Training Graph
                  Neural Network?},
  journal      = {CoRR},
  volume       = {abs/2309.07452},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2309-13482,
  author       = {Zhao Song and
                  Weixin Wang and
                  Junze Yin},
  title        = {A Unified Scheme of {ResNet} and Softmax},
  journal      = {CoRR},
  volume       = {abs/2309.13482},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2310-03331,
  author       = {Timothy Chu and
                  Zhao Song and
                  Chiwun Yang},
  title        = {Fine-tune Language Models to Approximate Unbiased In-context Learning},
  journal      = {CoRR},
  volume       = {abs/2310.03331},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2310-04064,
  author       = {Josh Alman and
                  Zhao Song},
  title        = {How to Capture Higher-order Correlations? Generalizing Matrix Softmax
                  Attention to {Kronecker} Computation},
  journal      = {CoRR},
  volume       = {abs/2310.04064},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2310-11291,
  author       = {Zhao Song and
                  Chiwun Yang},
  title        = {An Automatic Learning Rate Schedule Algorithm for Achieving Faster
                  Convergence and Steeper Descent},
  journal      = {CoRR},
  volume       = {abs/2310.11291},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2310-11685,
  author       = {Yichuan Deng and
                  Zhao Song and
                  Tianyi Zhou},
  title        = {Superiority of Softmax: Unveiling the Performance Edge Over Linear
                  Attention},
  journal      = {CoRR},
  volume       = {abs/2310.11685},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2310-12462,
  author       = {Yichuan Deng and
                  Zhao Song and
                  Shenghao Xie and
                  Chiwun Yang},
  title        = {Unmasking Transformers: {A} Theoretical Approach to Data Recovery
                  via Attention Weights},
  journal      = {CoRR},
  volume       = {abs/2310.12462},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2310-17157,
  author       = {Zichang Liu and
                  Jue Wang and
                  Tri Dao and
                  Tianyi Zhou and
                  Binhang Yuan and
                  Zhao Song and
                  Anshumali Shrivastava and
                  Ce Zhang and
                  Yuandong Tian and
                  Christopher R{\'{e}} and
                  Beidi Chen},
  title        = {Deja Vu: Contextual Sparsity for Efficient {LLMs} at Inference Time},
  journal      = {CoRR},
  volume       = {abs/2310.17157},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2310-20051,
  author       = {Zhao Song and
                  Guangyi Xu and
                  Junze Yin},
  title        = {The Expressibility of Polynomial based Attention Scheme},
  journal      = {CoRR},
  volume       = {abs/2310.20051},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2311-11429,
  author       = {Lianke Qin and
                  Saayan Mitra and
                  Zhao Song and
                  Yuanyuan Yang and
                  Tianyi Zhou},
  title        = {Fast Heavy Inner Product Identification Between Weights and Inputs
                  in Neural Network Training},
  journal      = {CoRR},
  volume       = {abs/2311.11429},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2311-13624,
  author       = {Chenyang Li and
                  Zhao Song and
                  Weixin Wang and
                  Chiwun Yang},
  title        = {A Theoretical Insight into Attack and Defense of Gradient Leakage
                  in Transformer},
  journal      = {CoRR},
  volume       = {abs/2311.13624},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2311-14652,
  author       = {Raghav Addanki and
                  Chenyang Li and
                  Zhao Song and
                  Chiwun Yang},
  title        = {One Pass Streaming Algorithm for Super Long Token Attention Approximation
                  in Sublinear Space},
  journal      = {CoRR},
  volume       = {abs/2311.14652},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2311-14823,
  author       = {Zhao Song and
                  Junze Yin and
                  Ruizhe Zhang},
  title        = {Revisiting Quantum Algorithms for Linear Regressions: Quadratic Speedups
                  without Data-Dependent Parameters},
  journal      = {CoRR},
  volume       = {abs/2311.14823},
  year         = {2023}
}
@article{DBLP:journals/corr/abs-2311-15390,
  author       = {Zhihang Li and
                  Zhao Song and
                  Zifan Wang and
                  Junze Yin},
  title        = {Local Convergence of Approximate {Newton} Method for Two Layer Nonlinear
                  Regression},
  journal      = {CoRR},
  volume       = {abs/2311.15390},
  year         = {2023}
}
@article{DBLP:journals/pvldb/QinJS0ZC22,
  author       = {Lianke Qin and
                  Rajesh Jayaram and
                  Elaine Shi and
                  Zhao Song and
                  Danyang Zhuo and
                  Shumo Chu},
  title        = {Differentially Oblivious Relational Database Operators},
  journal      = {Proc. {VLDB} Endow.},
  volume       = {16},
  number       = {4},
  pages        = {842--855},
  year         = {2022}
}
@article{DBLP:journals/quantum/GilyenST22,
  author       = {Andr{\'{a}}s Gily{\'{e}}n and
                  Zhao Song and
                  Ewin Tang},
  title        = {An improved quantum-inspired algorithm for linear regression},
  journal      = {Quantum},
  volume       = {6},
  pages        = {754},
  year         = {2022}
}
@inproceedings{DBLP:conf/aaai/JiangM0YZ22,
  author       = {Shunhua Jiang and
                  Yunze Man and
                  Zhao Song and
                  Zheng Yu and
                  Danyang Zhuo},
  title        = {Fast Graph Neural Tangent Kernel via {Kronecker} Sketching},
  booktitle    = {{AAAI}},
  pages        = {7033--7041},
  publisher    = {{AAAI} Press},
  year         = {2022}
}
@inproceedings{DBLP:conf/approx/SongZ22,
  author       = {Zhao Song and
                  Ruizhe Zhang},
  title        = {Hyperbolic Concentration, Anti-Concentration, and Discrepancy},
  booktitle    = {{APPROX/RANDOM}},
  series       = {LIPIcs},
  volume       = {245},
  pages        = {10:1--10:19},
  publisher    = {Schloss Dagstuhl - Leibniz-Zentrum f{\"{u}}r Informatik},
  year         = {2022}
}
@inproceedings{DBLP:conf/bigdataconf/QinRSXZ22,
  author       = {Lianke Qin and
                  Aravind Reddy and
                  Zhao Song and
                  Zhaozhuo Xu and
                  Danyang Zhuo},
  title        = {Adaptive and Dynamic Multi-Resolution Hashing for Pairwise Summations},
  booktitle    = {{IEEE} Big Data},
  pages        = {115--120},
  publisher    = {{IEEE}},
  year         = {2022}
}
@inproceedings{DBLP:conf/bigdataconf/LiSTZ22,
  author       = {Xiaoxiao Li and
                  Zhao Song and
                  Runzhou Tao and
                  Guangyi Zhang},
  title        = {A Convergence Theory for Federated Average: Beyond Smoothness},
  booktitle    = {{IEEE} Big Data},
  pages        = {1292--1297},
  publisher    = {{IEEE}},
  year         = {2022}
}
@inproceedings{DBLP:conf/focs/HuangJ0T022,
  author       = {Baihe Huang and
                  Shunhua Jiang and
                  Zhao Song and
                  Runzhou Tao and
                  Ruizhe Zhang},
  title        = {Solving {SDP} Faster: {A} Robust {IPM} Framework and Efficient Implementation},
  booktitle    = {{FOCS}},
  pages        = {233--244},
  publisher    = {{IEEE}},
  year         = {2022}
}
@inproceedings{DBLP:conf/iclr/ChenDLY0RR22,
  author       = {Beidi Chen and
                  Tri Dao and
                  Kaizhao Liang and
                  Jiaming Yang and
                  Zhao Song and
                  Atri Rudra and
                  Christopher R{\'{e}}},
  title        = {Pixelated Butterfly: Simple and Efficient Sparse training for Neural
                  Network Models},
  booktitle    = {{ICLR}},
  publisher    = {OpenReview.net},
  year         = {2022}
}
@inproceedings{DBLP:conf/icml/ChenFNZ0FR22,
  author       = {Mayee F. Chen and
                  Daniel Y. Fu and
                  Avanika Narayan and
                  Michael Zhang and
                  Zhao Song and
                  Kayvon Fatahalian and
                  Christopher R{\'{e}}},
  title        = {Perfectly Balanced: Improving Transfer and Robustness of Supervised
                  Contrastive Learning},
  booktitle    = {{ICML}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {162},
  pages        = {3090--3122},
  publisher    = {{PMLR}},
  year         = {2022}
}
@inproceedings{DBLP:conf/icml/MunteanuO0W22,
  author       = {Alexander Munteanu and
                  Simon Omlor and
                  Zhao Song and
                  David P. Woodruff},
  title        = {Bounding the Width of Neural Networks via Coupled Initialization --
                  {A} Worst Case Analysis},
  booktitle    = {{ICML}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {162},
  pages        = {16083--16122},
  publisher    = {{PMLR}},
  year         = {2022}
}
@inproceedings{DBLP:conf/icml/ReddyR0RMLWKA22,
  author       = {Aravind Reddy and
                  Ryan A. Rossi and
                  Zhao Song and
                  Anup B. Rao and
                  Tung Mai and
                  Nedim Lipka and
                  Gang Wu and
                  Eunyee Koh and
                  Nesreen K. Ahmed},
  title        = {One-Pass Algorithms for {MAP} Inference of Nonsymmetric Determinantal
                  Point Processes},
  booktitle    = {{ICML}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {162},
  pages        = {18463--18482},
  publisher    = {{PMLR}},
  year         = {2022}
}
@inproceedings{DBLP:conf/innovations/Chen0T022,
  author       = {Sitan Chen and
                  Zhao Song and
                  Runzhou Tao and
                  Ruizhe Zhang},
  title        = {Symmetric Sparse {Boolean} Matrix Factorization and Applications},
  booktitle    = {{ITCS}},
  series       = {LIPIcs},
  volume       = {215},
  pages        = {46:1--46:25},
  publisher    = {Schloss Dagstuhl - Leibniz-Zentrum f{\"{u}}r Informatik},
  year         = {2022}
}
@inproceedings{DBLP:conf/nips/00020W022,
  author       = {Yichuan Deng and
                  Zhao Song and
                  Omri Weinstein and
                  Ruizhe Zhang},
  title        = {Fast Distance Oracles for Any Symmetric Norm},
  booktitle    = {NeurIPS},
  year         = {2022}
}
@inproceedings{DBLP:conf/nips/Reddy0022,
  author       = {Aravind Reddy and
                  Zhao Song and
                  Lichen Zhang},
  title        = {Dynamic Tensor Product Regression},
  booktitle    = {NeurIPS},
  year         = {2022}
}
@article{DBLP:journals/corr/abs-2202-12329,
  author       = {Baihe Huang and
                  Zhao Song and
                  Omri Weinstein and
                  Hengjie Zhang and
                  Ruizhe Zhang},
  title        = {A Dynamic Fast {Gaussian} Transform},
  journal      = {CoRR},
  volume       = {abs/2202.12329},
  year         = {2022}
}
@article{DBLP:journals/corr/abs-2204-03209,
  author       = {Zhao Song and
                  Zhaozhuo Xu and
                  Lichen Zhang},
  title        = {Speeding Up Sparsification using Inner Product Search Data Structures},
  journal      = {CoRR},
  volume       = {abs/2204.03209},
  year         = {2022}
}
@article{DBLP:journals/corr/abs-2204-07596,
  author       = {Mayee F. Chen and
                  Daniel Y. Fu and
                  Avanika Narayan and
                  Michael Zhang and
                  Zhao Song and
                  Kayvon Fatahalian and
                  Christopher R{\'{e}}},
  title        = {Perfectly Balanced: Improving Transfer and Robustness of Supervised
                  Contrastive Learning},
  journal      = {CoRR},
  volume       = {abs/2204.07596},
  year         = {2022}
}
@article{DBLP:journals/corr/abs-2204-10979,
  author       = {Kai Wang and
                  Zhao Song and
                  Georgios Theocharous and
                  Sridhar Mahadevan},
  title        = {Smoothed Online Combinatorial Optimization Using Imperfect Predictions},
  journal      = {CoRR},
  volume       = {abs/2204.10979},
  year         = {2022}
}
@article{DBLP:journals/corr/abs-2205-00658,
  author       = {Zhao Song and
                  Baocheng Sun and
                  Omri Weinstein and
                  Ruizhe Zhang},
  title        = {Sparse {Fourier} Transform over Lattices: {A} Unified Approach to Signal
                  Reconstruction},
  journal      = {CoRR},
  volume       = {abs/2205.00658},
  year         = {2022}
}
@article{DBLP:journals/corr/abs-2205-14816,
  author       = {Yichuan Deng and
                  Zhao Song and
                  Omri Weinstein and
                  Ruizhe Zhang},
  title        = {Fast Distance Oracles for Any Symmetric Norm},
  journal      = {CoRR},
  volume       = {abs/2205.14816},
  year         = {2022}
}
@article{DBLP:journals/corr/abs-2206-12802,
  author       = {Alexander Munteanu and
                  Simon Omlor and
                  Zhao Song and
                  David P. Woodruff},
  title        = {Bounding the Width of Neural Networks via Coupled Initialization --
                  {A} Worst Case Analysis},
  journal      = {CoRR},
  volume       = {abs/2206.12802},
  year         = {2022}
}
@article{DBLP:journals/corr/abs-2207-09002,
  author       = {Zhao Song and
                  Zhaozhuo Xu and
                  Yuanyuan Yang and
                  Lichen Zhang},
  title        = {Accelerating {Frank-Wolfe} Algorithm using Low-Dimensional and Adaptive
                  Data Structures},
  journal      = {CoRR},
  volume       = {abs/2207.09002},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2207.09002}
}
@article{DBLP:journals/corr/abs-2208-03367,
  author       = {Hang Hu and
                  Zhao Song and
                  Runzhou Tao and
                  Zhaozhuo Xu and
                  Danyang Zhuo},
  title        = {Sublinear Time Algorithm for Online Weighted Bipartite Matching},
  journal      = {CoRR},
  volume       = {abs/2208.03367},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2208.03367}
}
@article{DBLP:journals/corr/abs-2208-03635,
  author       = {Xiaoxiao Li and
                  Zhao Song and
                  Jiaming Yang},
  title        = {Federated Adversarial Learning: {A} Framework with Convergence Analysis},
  journal      = {CoRR},
  volume       = {abs/2208.03635},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2208.03635}
}
@article{DBLP:journals/corr/abs-2208-03915,
  author       = {Jiehao Liang and
                  Zhao Song and
                  Zhaozhuo Xu and
                  Danyang Zhuo},
  title        = {Dynamic Maintenance of Kernel Density Estimation Data Structure: From
                  Practice to Theory},
  journal      = {CoRR},
  volume       = {abs/2208.03915},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2208.03915}
}
@article{DBLP:journals/corr/abs-2208-04508,
  author       = {Hang Hu and
                  Zhao Song and
                  Omri Weinstein and
                  Danyang Zhuo},
  title        = {Training Overparametrized Neural Networks in Sublinear Time},
  journal      = {CoRR},
  volume       = {abs/2208.04508},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2208.04508}
}
@article{DBLP:journals/corr/abs-2208-05395,
  author       = {Yeqi Gao and
                  Lianke Qin and
                  Zhao Song and
                  Yitan Wang},
  title        = {A Sublinear Adversarial Training Algorithm},
  journal      = {CoRR},
  volume       = {abs/2208.05395},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2208.05395}
}
@article{DBLP:journals/corr/abs-2208-09634,
  author       = {Yeqi Gao and
                  Zhao Song and
                  Baocheng Sun},
  title        = {An {$O(k \log n)$} Time {Fourier} Set Query Algorithm},
  journal      = {CoRR},
  volume       = {abs/2208.09634},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2208.09634}
}
@article{DBLP:journals/corr/abs-2210-03961,
  author       = {Aravind Reddy and
                  Zhao Song and
                  Lichen Zhang},
  title        = {Dynamic Tensor Product Regression},
  journal      = {CoRR},
  volume       = {abs/2210.03961},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2210.03961}
}
@article{DBLP:journals/corr/abs-2210-08361,
  author       = {Yichuan Deng and
                  Zhao Song and
                  Yitan Wang and
                  Yuanyuan Yang},
  title        = {A Nearly Optimal Size Coreset Algorithm with Nearly Linear Time},
  journal      = {CoRR},
  volume       = {abs/2210.08361},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2210.08361}
}
@article{DBLP:journals/corr/abs-2210-08371,
  author       = {Zhao Song and
                  Yitan Wang and
                  Zheng Yu and
                  Lichen Zhang},
  title        = {Sketching for First Order Method: Efficient Algorithm for Low-Bandwidth
                  Channel and Vulnerability},
  journal      = {CoRR},
  volume       = {abs/2210.08371},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2210.08371}
}
@article{DBLP:journals/corr/abs-2210-11542,
  author       = {Zhao Song and
                  Xin Yang and
                  Yuanyuan Yang and
                  Lichen Zhang},
  title        = {Sketching Meets Differential Privacy: Fast Algorithm for Dynamic {Kronecker}
                  Projection Maintenance},
  journal      = {CoRR},
  volume       = {abs/2210.11542},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2210.11542}
}
@article{DBLP:journals/corr/abs-2210-12468,
  author       = {Yichuan Deng and
                  Zhao Song and
                  Omri Weinstein},
  title        = {Discrepancy Minimization in Input-Sparsity Time},
  journal      = {CoRR},
  volume       = {abs/2210.12468},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2210.12468}
}
@article{DBLP:journals/corr/abs-2210-12495,
  author       = {Zhao Song and
                  Baocheng Sun and
                  Omri Weinstein and
                  Ruizhe Zhang},
  title        = {Quartic Samples Suffice for {Fourier} Interpolation},
  journal      = {CoRR},
  volume       = {abs/2210.12495},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2210.12495}
}
@article{DBLP:journals/corr/abs-2211-01588,
  author       = {Xiaoxiao Li and
                  Zhao Song and
                  Runzhou Tao and
                  Guangyi Zhang},
  title        = {A Convergence Theory for Federated Average: Beyond Smoothness},
  journal      = {CoRR},
  volume       = {abs/2211.01588},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2211.01588}
}
@article{DBLP:journals/corr/abs-2211-06033,
  author       = {Yuzhou Gu and
                  Zhao Song},
  title        = {A Faster Small Treewidth {SDP} Solver},
  journal      = {CoRR},
  volume       = {abs/2211.06033},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2211.06033}
}
@article{DBLP:journals/corr/abs-2211-14227,
  author       = {Josh Alman and
                  Jiehao Liang and
                  Zhao Song and
                  Ruizhe Zhang and
                  Danyang Zhuo},
  title        = {Bypass Exponential Time Preprocessing: Fast Neural Network Training
                  via Weight-Data Correlation Preprocessing},
  journal      = {CoRR},
  volume       = {abs/2211.14227},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2211.14227}
}
@article{DBLP:journals/corr/abs-2211-14407,
  author       = {Zhao Song and
                  Xin Yang and
                  Yuanyuan Yang and
                  Tianyi Zhou},
  title        = {Faster Algorithm for Structured {John} Ellipsoid Computation},
  journal      = {CoRR},
  volume       = {abs/2211.14407},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2211.14407}
}
@article{DBLP:journals/corr/abs-2211-14825,
  author       = {Yichuan Deng and
                  Wenyu Jin and
                  Zhao Song and
                  Xiaorui Sun and
                  Omri Weinstein},
  title        = {Dynamic Kernel Sparsifiers},
  journal      = {CoRR},
  volume       = {abs/2211.14825},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2211.14825}
}
@article{DBLP:journals/corr/abs-2211-15118,
  author       = {Jiehao Liang and
                  Somdeb Sarkhel and
                  Zhao Song and
                  Chenbo Yin and
                  Danyang Zhuo},
  title        = {A Faster k-means++ Algorithm},
  journal      = {CoRR},
  volume       = {abs/2211.15118},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2211.15118}
}
@article{DBLP:journals/corr/abs-2212-05176,
  author       = {Lianke Qin and
                  Rajesh Jayaram and
                  Elaine Shi and
                  Zhao Song and
                  Danyang Zhuo and
                  Shumo Chu},
  title        = {Adore: Differentially Oblivious Relational Database Operators},
  journal      = {CoRR},
  volume       = {abs/2212.05176},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2212.05176}
}
@article{DBLP:journals/corr/abs-2212-11408,
  author       = {Lianke Qin and
                  Aravind Reddy and
                  Zhao Song and
                  Zhaozhuo Xu and
                  Danyang Zhuo},
  title        = {Adaptive and Dynamic Multi-Resolution Hashing for Pairwise Summations},
  journal      = {CoRR},
  volume       = {abs/2212.11408},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2212.11408}
}
% Technical report TR22-161 in the Electron. Colloquium Comput. Complex. series (2022).
@article{DBLP:journals/eccc/0001KPS0Y22,
  author = {Lijie Chen and Gillat Kol and Dmitry Paramonov and
            Raghuvansh Saxena and Zhao Song and Huacheng Yu},
  title = {Towards Multi-Pass Streaming Lower Bounds for Optimal Approximation of Max-Cut},
  journal = {Electron. Colloquium Comput. Complex.},
  volume = {{TR22-161}},
  year = {2022},
}
% Journal article: J. ACM, volume 68, number 1 (2021).
@article{DBLP:journals/jacm/CohenLS21,
  author = {Michael B. Cohen and Yin Tat Lee and Zhao Song},
  title = {Solving Linear Programs in the Current Matrix Multiplication Time},
  journal = {J. {ACM}},
  volume = {68},
  number = {1},
  pages = {3:1--3:39},
  year = {2021},
}
% Conference version; the CoRR record with the same title is
% DBLP:journals/corr/abs-2102-11251.
@inproceedings{DBLP:conf/icalp/0001KPS0Y21,
  author       = {Lijie Chen and
                  Gillat Kol and
                  Dmitry Paramonov and
                  Raghuvansh R. Saxena and
                  Zhao Song and
                  Huacheng Yu},
  title        = {Near-Optimal Two-Pass Streaming Algorithm for Sampling Random Walks
                  over Directed Graphs},
  booktitle    = {{ICALP}},
  series       = {LIPIcs},
  volume       = {198},
  pages        = {52:1--52:19},
  publisher    = {Schloss Dagstuhl -- Leibniz-Zentrum f{\"{u}}r Informatik},
  year         = {2021}
}
@inproceedings{DBLP:conf/iclr/ChenL0Z21,
  author       = {Sitan Chen and
                  Xiaoxiao Li and
                  Zhao Song and
                  Danyang Zhuo},
  title        = {On {InstaHide}, Phase Retrieval, and Sparse Matrix Factorization},
  booktitle    = {{ICLR}},
  publisher    = {OpenReview.net},
  year         = {2021}
}
% ICLR 2021 paper; the record carries no page numbers.
@inproceedings{DBLP:conf/iclr/ChenLPXLD0SR21,
  author = {Beidi Chen and Zichang Liu and Binghui Peng and Zhaozhuo Xu and
            Jonathan Lingjie Li and Tri Dao and Zhao Song and
            Anshumali Shrivastava and Christopher R{\'{e}}},
  title = {{MONGOOSE:} {A} Learnable {LSH} Framework for Efficient Neural Network Training},
  booktitle = {{ICLR}},
  publisher = {OpenReview.net},
  year = {2021},
}
% ICML 2021 paper (PMLR volume 139). The CoRR record by the same authors,
% DBLP:journals/corr/abs-2105-05001, has a slightly longer title.
@inproceedings{DBLP:conf/icml/HuangL0021,
  author = {Baihe Huang and Xiaoxiao Li and Zhao Song and Xin Yang},
  title = {{FL-NTK:} {A} Neural Tangent Kernel-based Framework for Federated Learning Analysis},
  booktitle = {{ICML}},
  series = {Proceedings of Machine Learning Research},
  volume = {139},
  pages = {4423--4434},
  publisher = {{PMLR}},
  year = {2021},
}
% ICML 2021 paper (PMLR volume 139); the CoRR record with the same title and
% authors is DBLP:journals/corr/abs-2108-09420.
@inproceedings{DBLP:conf/icml/0002WYZ21,
  author = {Zhao Song and David P. Woodruff and Zheng Yu and Lichen Zhang},
  title = {Fast Sketching of Polynomial Kernels of Polynomial Degree},
  booktitle = {{ICML}},
  series = {Proceedings of Machine Learning Research},
  volume = {139},
  pages = {9812--9823},
  publisher = {{PMLR}},
  year = {2021},
}
% ICML 2021 paper (PMLR volume 139).
@inproceedings{DBLP:conf/icml/0002Y21,
  author = {Zhao Song and Zheng Yu},
  title = {Oblivious Sketching-based Central Path Method for Linear Programming},
  booktitle = {{ICML}},
  series = {Proceedings of Machine Learning Research},
  volume = {139},
  pages = {9835--9847},
  publisher = {{PMLR}},
  year = {2021},
}
% Conference version; the CoRR record with the same title and authors is
% DBLP:journals/corr/abs-2006-11648.
@inproceedings{DBLP:conf/innovations/BrandP0W21,
  author       = {Jan van den Brand and
                  Binghui Peng and
                  Zhao Song and
                  Omri Weinstein},
  title        = {Training (Overparametrized) Neural Networks in Near-Linear Time},
  booktitle    = {{ITCS}},
  series       = {LIPIcs},
  volume       = {185},
  pages        = {63:1--63:15},
  publisher    = {Schloss Dagstuhl -- Leibniz-Zentrum f{\"{u}}r Informatik},
  year         = {2021}
}
% Conference version; the CoRR record with the same title is
% DBLP:journals/corr/abs-2111-15139 (authors listed in a different order).
@inproceedings{DBLP:conf/nips/XuSS21,
  author       = {Zhaozhuo Xu and
                  Zhao Song and
                  Anshumali Shrivastava},
  title        = {Breaking the Linear Iteration Cost Barrier for Some Well-known Conditional
                  Gradient Methods Using {MaxIP} Data-structures},
  booktitle    = {{NeurIPS}},
  pages        = {5576--5589},
  year         = {2021}
}
% Conference version; the CoRR record with the same title and authors is
% DBLP:journals/corr/abs-2112-00059.
@inproceedings{DBLP:conf/nips/HuangGSLA21,
  author       = {Yangsibo Huang and
                  Samyak Gupta and
                  Zhao Song and
                  Kai Li and
                  Sanjeev Arora},
  title        = {Evaluating Gradient Inversion Attacks and Defenses in Federated Learning},
  booktitle    = {{NeurIPS}},
  pages        = {7232--7241},
  year         = {2021}
}
% Conference version; the CoRR record by the same authors,
% DBLP:journals/corr/abs-2110-15343, has a slightly longer title.
@inproceedings{DBLP:conf/nips/ChenDWSRR21,
  author       = {Beidi Chen and
                  Tri Dao and
                  Eric Winsor and
                  Zhao Song and
                  Atri Rudra and
                  Christopher R{\'{e}}},
  title        = {Scatterbrain: Unifying Sparse and Low-rank Attention},
  booktitle    = {{NeurIPS}},
  pages        = {17413--17426},
  year         = {2021}
}
% Conference version; the CoRR record with the same title and authors is
% DBLP:journals/corr/abs-2110-04622.
@inproceedings{DBLP:conf/nips/SongYZ21,
  author       = {Zhao Song and
                  Shuo Yang and
                  Ruizhe Zhang},
  title        = {Does Preprocessing Help Training Over-parameterized Neural Networks?},
  booktitle    = {{NeurIPS}},
  pages        = {22890--22904},
  year         = {2021}
}
% STOC 2021 paper; DBLP:journals/eccc/ChenKPSSY21 is the technical-report
% record with the same title (capitalised differently).
@inproceedings{DBLP:conf/stoc/0001KPS0Y21,
  author = {Lijie Chen and Gillat Kol and Dmitry Paramonov and
            Raghuvansh R. Saxena and Zhao Song and Huacheng Yu},
  title = {Almost optimal super-constant-pass streaming lower bounds for reachability},
  booktitle = {{STOC}},
  pages = {570--583},
  publisher = {{ACM}},
  year = {2021},
}
@inproceedings{DBLP:conf/stoc/Jiang0WZ21,
  author       = {Shunhua Jiang and
                  Zhao Song and
                  Omri Weinstein and
                  Hengjie Zhang},
  title        = {A faster algorithm for solving general {LPs}},
  booktitle    = {{STOC}},
  pages        = {823--832},
  publisher    = {{ACM}},
  year         = {2021}
}
% Conference version; the CoRR record with the same title and authors is
% DBLP:journals/corr/abs-2101-05719.
@inproceedings{DBLP:conf/stoc/BrandLLSS0W21,
  author       = {Jan van den Brand and
                  Yin Tat Lee and
                  Yang P. Liu and
                  Thatchaphol Saranurak and
                  Aaron Sidford and
                  Zhao Song and
                  Di Wang},
  title        = {Minimum cost flows, {MDPs}, and {$\ell_1$}-regression
                  in nearly linear time for dense instances},
  booktitle    = {{STOC}},
  pages        = {859--869},
  publisher    = {{ACM}},
  year         = {2021}
}
% UAI 2021 paper (PMLR volume 161).
@inproceedings{DBLP:conf/uai/DuH0S0021,
  author = {Simon S. Du and Wei Hu and Zhiyuan Li and
            Ruoqi Shen and Zhao Song and Jiajun Wu},
  title = {When is particle filtering efficient for planning in partially observed
           linear dynamical systems?},
  booktitle = {{UAI}},
  series = {Proceedings of Machine Learning Research},
  volume = {161},
  pages = {728--737},
  publisher = {{AUAI} Press},
  year = {2021},
}
% Preprint record; the STOC 2021 record with the same title and authors is
% DBLP:conf/stoc/BrandLLSS0W21.
@article{DBLP:journals/corr/abs-2101-05719,
  author       = {Jan van den Brand and
                  Yin Tat Lee and
                  Yang P. Liu and
                  Thatchaphol Saranurak and
                  Aaron Sidford and
                  Zhao Song and
                  Di Wang},
  title        = {Minimum Cost Flows, {MDPs}, and {$\ell_1$}-Regression
                  in Nearly Linear Time for Dense Instances},
  journal      = {CoRR},
  volume       = {abs/2101.05719},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2101.05719}
}
@article{DBLP:journals/corr/abs-2101-08208,
  author       = {Baihe Huang and
                  Shunhua Jiang and
                  Zhao Song and
                  Runzhou Tao},
  title        = {Solving Tall Dense {SDPs} in the Current Matrix Multiplication Time},
  journal      = {CoRR},
  volume       = {abs/2101.08208},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2101.08208}
}
@article{DBLP:journals/corr/abs-2102-01570,
  author       = {Sitan Chen and
                  Zhao Song and
                  Runzhou Tao and
                  Ruizhe Zhang},
  title        = {Symmetric {Boolean} Factor Analysis with Applications to {InstaHide}},
  journal      = {CoRR},
  volume       = {abs/2102.01570},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2102.01570}
}
% Preprint record; the ICALP 2021 record with the same title is
% DBLP:conf/icalp/0001KPS0Y21.
@article{DBLP:journals/corr/abs-2102-11251,
  author       = {Lijie Chen and
                  Gillat Kol and
                  Dmitry Paramonov and
                  Raghuvansh Saxena and
                  Zhao Song and
                  Huacheng Yu},
  title        = {Near-Optimal Two-Pass Streaming Algorithm for Sampling Random Walks
                  over Directed Graphs},
  journal      = {CoRR},
  volume       = {abs/2102.11251},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2102.11251}
}
% Preprint record; the ICML 2021 record by the same authors,
% DBLP:conf/icml/HuangL0021, has a slightly shorter title.
@article{DBLP:journals/corr/abs-2105-05001,
  author       = {Baihe Huang and
                  Xiaoxiao Li and
                  Zhao Song and
                  Xin Yang},
  title        = {{FL-NTK:} {A} Neural Tangent Kernel-based Framework for Federated
                  Learning Convergence Analysis},
  journal      = {CoRR},
  volume       = {abs/2105.05001},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2105.05001}
}
@article{DBLP:journals/corr/abs-2105-08285,
  author       = {Anshumali Shrivastava and
                  Zhao Song and
                  Zhaozhuo Xu},
  title        = {Sublinear Least-Squares Value Iteration via Locality Sensitive Hashing},
  journal      = {CoRR},
  volume       = {abs/2105.08285},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2105.08285}
}
% Preprint record; the ICML 2021 record with the same title and authors is
% DBLP:conf/icml/0002WYZ21.
@article{DBLP:journals/corr/abs-2108-09420,
  author       = {Zhao Song and
                  David P. Woodruff and
                  Zheng Yu and
                  Lichen Zhang},
  title        = {Fast Sketching of Polynomial Kernels of Polynomial Degree},
  journal      = {CoRR},
  volume       = {abs/2108.09420},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2108.09420}
}
% Preprint record; the NeurIPS 2021 record with the same title and authors is
% DBLP:conf/nips/SongYZ21.
@article{DBLP:journals/corr/abs-2110-04622,
  author       = {Zhao Song and
                  Shuo Yang and
                  Ruizhe Zhang},
  title        = {Does Preprocessing Help Training Over-parameterized Neural Networks?},
  journal      = {CoRR},
  volume       = {abs/2110.04622},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2110.04622}
}
% Preprint record; the NeurIPS 2021 record by the same authors,
% DBLP:conf/nips/ChenDWSRR21, has a slightly shorter title.
@article{DBLP:journals/corr/abs-2110-15343,
  author       = {Beidi Chen and
                  Tri Dao and
                  Eric Winsor and
                  Zhao Song and
                  Atri Rudra and
                  Christopher R{\'{e}}},
  title        = {Scatterbrain: Unifying Sparse and Low-rank Attention Approximation},
  journal      = {CoRR},
  volume       = {abs/2110.15343},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2110.15343}
}
@article{DBLP:journals/corr/abs-2111-03030,
  author       = {Sudhanshu Chanpuriya and
                  Ryan A. Rossi and
                  Anup B. Rao and
                  Tung Mai and
                  Nedim Lipka and
                  Zhao Song and
                  Cameron Musco},
  title        = {An Interpretable Graph Generative Model with Heterophily},
  journal      = {CoRR},
  volume       = {abs/2111.03030},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2111.03030}
}
% Preprint record; the journal record with the same title and authors is
% DBLP:journals/siamcomp/RubinsteinSSS25.
@article{DBLP:journals/corr/abs-2111-10538,
  author       = {Aviad Rubinstein and
                  Saeed Seddighin and
                  Zhao Song and
                  Xiaorui Sun},
  title        = {Approximation Algorithms for {LCS} and {LIS} with Truly Improved Running
                  Times},
  journal      = {CoRR},
  volume       = {abs/2111.10538},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2111.10538}
}
@article{DBLP:journals/corr/abs-2111-14674,
  author       = {Aravind Reddy and
                  Ryan A. Rossi and
                  Zhao Song and
                  Anup B. Rao and
                  Tung Mai and
                  Nedim Lipka and
                  Gang Wu and
                  Eunyee Koh and
                  Nesreen K. Ahmed},
  title        = {Online {MAP} Inference and Learning for Nonsymmetric Determinantal
                  Point Processes},
  journal      = {CoRR},
  volume       = {abs/2111.14674},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2111.14674}
}
% Preprint record; the NeurIPS 2021 record with the same title is
% DBLP:conf/nips/XuSS21 (authors listed in a different order).
@article{DBLP:journals/corr/abs-2111-15139,
  author       = {Anshumali Shrivastava and
                  Zhao Song and
                  Zhaozhuo Xu},
  title        = {Breaking the Linear Iteration Cost Barrier for Some Well-known Conditional
                  Gradient Methods Using {MaxIP} Data-structures},
  journal      = {CoRR},
  volume       = {abs/2111.15139},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2111.15139}
}
@article{DBLP:journals/corr/abs-2112-00029,
  author       = {Beidi Chen and
                  Tri Dao and
                  Kaizhao Liang and
                  Jiaming Yang and
                  Zhao Song and
                  Atri Rudra and
                  Christopher R{\'{e}}},
  title        = {Pixelated Butterfly: Simple and Efficient Sparse training for Neural
                  Network Models},
  journal      = {CoRR},
  volume       = {abs/2112.00029},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2112.00029}
}
% Preprint record; the NeurIPS 2021 record with the same title and authors is
% DBLP:conf/nips/HuangGSLA21.
@article{DBLP:journals/corr/abs-2112-00059,
  author       = {Yangsibo Huang and
                  Samyak Gupta and
                  Zhao Song and
                  Kai Li and
                  Sanjeev Arora},
  title        = {Evaluating Gradient Inversion Attacks and Defenses in Federated Learning},
  journal      = {CoRR},
  volume       = {abs/2112.00059},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2112.00059}
}
@article{DBLP:journals/corr/abs-2112-02446,
  author       = {Shunhua Jiang and
                  Yunze Man and
                  Zhao Song and
                  Zheng Yu and
                  Danyang Zhuo},
  title        = {Fast Graph Neural Tangent Kernel via {Kronecker} Sketching},
  journal      = {CoRR},
  volume       = {abs/2112.02446},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2112.02446}
}
@article{DBLP:journals/corr/abs-2112-05120,
  author       = {Wei Deng and
                  Yi{-}An Ma and
                  Zhao Song and
                  Qian Zhang and
                  Guang Lin},
  title        = {On Convergence of Federated Averaging {Langevin} Dynamics},
  journal      = {CoRR},
  volume       = {abs/2112.05120},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2112.05120}
}
@article{DBLP:journals/corr/abs-2112-07628,
  author       = {Zhao Song and
                  Lichen Zhang and
                  Ruizhe Zhang},
  title        = {Training Multi-Layer Over-Parametrized Neural Network in Subquadratic
                  Time},
  journal      = {CoRR},
  volume       = {abs/2112.07628},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2112.07628}
}
% Technical report TR21-027 (2021); DBLP:conf/stoc/0001KPS0Y21 is the STOC
% record with the same title (capitalised differently).
@article{DBLP:journals/eccc/ChenKPSSY21,
  author = {Lijie Chen and Gillat Kol and Dmitry Paramonov and
            Raghuvansh Saxena and Zhao Song and Huacheng Yu},
  title = {Almost Optimal Super-Constant-Pass Streaming Lower Bounds for Reachability},
  journal = {Electron. Colloquium Comput. Complex.},
  volume = {{TR21-027}},
  year = {2021},
}
% AISTATS 2020 paper (PMLR volume 108); the CoRR record with the same title is
% DBLP:journals/corr/abs-2002-09812.
@inproceedings{DBLP:conf/aistats/LiangSWY020,
  author = {Yingyu Liang and Zhao Song and Mengdi Wang and Lin Yang and Xin Yang},
  title = {Sketching Transformed Matrices with Applications to Natural Language Processing},
  booktitle = {{AISTATS}},
  series = {Proceedings of Machine Learning Research},
  volume = {108},
  pages = {467--481},
  publisher = {{PMLR}},
  year = {2020},
}
@inproceedings{DBLP:conf/emnlp/HuangSCLA20,
  author       = {Yangsibo Huang and
                  Zhao Song and
                  Danqi Chen and
                  Kai Li and
                  Sanjeev Arora},
  title        = {{TextHide}: Tackling Data Privacy for Language Understanding Tasks},
  booktitle    = {{EMNLP} (Findings)},
  series       = {Findings of {ACL}},
  volume       = {{EMNLP} 2020},
  pages        = {1368--1382},
  publisher    = {Association for Computational Linguistics},
  year         = {2020}
}
% FOCS 2020 paper.
@inproceedings{DBLP:conf/focs/AlmanCS020,
  author = {Josh Alman and Timothy Chu and Aaron Schild and Zhao Song},
  title = {Algorithms and Hardness for Linear Algebra on Geometric Graphs},
  booktitle = {{FOCS}},
  pages = {541--552},
  publisher = {{IEEE}},
  year = {2020},
}
% FOCS 2020 paper.
@inproceedings{DBLP:conf/focs/JiangKLP020,
  author = {Haotian Jiang and Tarun Kathuria and Yin Tat Lee and
            Swati Padmanabhan and Zhao Song},
  title = {A Faster Interior Point Method for Semidefinite Programming},
  booktitle = {{FOCS}},
  pages = {910--918},
  publisher = {{IEEE}},
  year = {2020},
}
% FOCS 2020 paper; the CoRR record with the same title and authors is
% DBLP:journals/corr/abs-2009-01802.
@inproceedings{DBLP:conf/focs/BrandLNPSS0W20,
  author = {Jan van den Brand and Yin Tat Lee and Danupon Nanongkai and
            Richard Peng and Thatchaphol Saranurak and Aaron Sidford and
            Zhao Song and Di Wang},
  title = {Bipartite Matching in Nearly-linear Time on Moderately Dense Graphs},
  booktitle = {{FOCS}},
  pages = {919--930},
  publisher = {{IEEE}},
  year = {2020},
}
@inproceedings{DBLP:conf/icml/Huang0LA20,
  author       = {Yangsibo Huang and
                  Zhao Song and
                  Kai Li and
                  Sanjeev Arora},
  title        = {{InstaHide}: Instance-hiding Schemes for Private Distributed Learning},
  booktitle    = {{ICML}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {119},
  pages        = {4507--4518},
  publisher    = {{PMLR}},
  year         = {2020}
}
% ICML 2020 paper (PMLR volume 119); the CoRR record with the same title
% (capitalised differently) is DBLP:journals/corr/abs-2002-08936.
@inproceedings{DBLP:conf/icml/KongSSKO20,
  author = {Weihao Kong and Raghav Somani and Zhao Song and
            Sham M. Kakade and Sewoong Oh},
  title = {Meta-learning for Mixed Linear Regression},
  booktitle = {{ICML}},
  series = {Proceedings of Machine Learning Research},
  volume = {119},
  pages = {5394--5404},
  publisher = {{PMLR}},
  year = {2020},
}
@inproceedings{DBLP:conf/nips/LeeSSWY20,
  author       = {Jason D. Lee and
                  Ruoqi Shen and
                  Zhao Song and
                  Mengdi Wang and
                  Zheng Yu},
  title        = {Generalized Leverage Score Sampling for Neural Networks},
  booktitle    = {{NeurIPS}},
  year         = {2020}
}
% Conference version; the CoRR record with the same title and authors is
% DBLP:journals/corr/abs-2002-06668.
@inproceedings{DBLP:conf/nips/ZhangPDLSA20,
  author       = {Yi Zhang and
                  Orestis Plevrakis and
                  Simon S. Du and
                  Xingguo Li and
                  Zhao Song and
                  Sanjeev Arora},
  title        = {Over-parameterized Adversarial Training: An Analysis Overcoming the
                  Curse of Dimensionality},
  booktitle    = {{NeurIPS}},
  year         = {2020}
}
% SODA 2020 paper.
@inproceedings{DBLP:conf/soda/RubinsteinS20,
  author = {Aviad Rubinstein and Zhao Song},
  title = {Reducing approximate Longest Common Subsequence to approximate Edit Distance},
  booktitle = {{SODA}},
  pages = {1591--1600},
  publisher = {{SIAM}},
  year = {2020},
}
@inproceedings{DBLP:conf/stoc/Chen0S20,
  author       = {Sitan Chen and
                  Jerry Li and
                  Zhao Song},
  title        = {Learning mixtures of linear regressions in subexponential time via
                  {Fourier} moments},
  booktitle    = {{STOC}},
  pages        = {587--600},
  publisher    = {{ACM}},
  year         = {2020}
}
% STOC 2020 paper; the CoRR record with the same title (capitalised
% differently) and authors is DBLP:journals/corr/abs-2002-02304.
@inproceedings{DBLP:conf/stoc/BrandLSS20,
  author = {Jan van den Brand and Yin Tat Lee and Aaron Sidford and Zhao Song},
  title = {Solving tall dense linear programs in nearly linear time},
  booktitle = {{STOC}},
  pages = {775--788},
  publisher = {{ACM}},
  year = {2020},
}
% STOC 2020 paper; the CoRR record by the same authors with a near-identical
% title is DBLP:journals/corr/abs-2004-04250.
@inproceedings{DBLP:conf/stoc/JiangLSW20,
  author = {Haotian Jiang and Yin Tat Lee and Zhao Song and Sam Chiu{-}wai Wong},
  title = {An improved cutting plane method for convex optimization, convex-concave
           games, and its applications},
  booktitle = {{STOC}},
  pages = {944--953},
  publisher = {{ACM}},
  year = {2020},
}
% Preprint record; the STOC 2020 record with the same title (capitalised
% differently) and authors is DBLP:conf/stoc/BrandLSS20.
@article{DBLP:journals/corr/abs-2002-02304,
  author       = {Jan van den Brand and
                  Yin Tat Lee and
                  Aaron Sidford and
                  Zhao Song},
  title        = {Solving Tall Dense Linear Programs in Nearly Linear Time},
  journal      = {CoRR},
  volume       = {abs/2002.02304},
  year         = {2020},
  eprinttype   = {arXiv},
  eprint       = {2002.02304}
}
% Preprint record; the NeurIPS 2020 record with the same title and authors is
% DBLP:conf/nips/ZhangPDLSA20.
@article{DBLP:journals/corr/abs-2002-06668,
  author       = {Yi Zhang and
                  Orestis Plevrakis and
                  Simon S. Du and
                  Xingguo Li and
                  Zhao Song and
                  Sanjeev Arora},
  title        = {Over-parameterized Adversarial Training: An Analysis Overcoming the
                  Curse of Dimensionality},
  journal      = {CoRR},
  volume       = {abs/2002.06668},
  year         = {2020},
  eprinttype   = {arXiv},
  eprint       = {2002.06668}
}
% Preprint record; the ICML 2020 record with the same title (capitalised
% differently) and authors is DBLP:conf/icml/KongSSKO20.
@article{DBLP:journals/corr/abs-2002-08936,
  author       = {Weihao Kong and
                  Raghav Somani and
                  Zhao Song and
                  Sham M. Kakade and
                  Sewoong Oh},
  title        = {Meta-learning for mixed linear regression},
  journal      = {CoRR},
  volume       = {abs/2002.08936},
  year         = {2020},
  eprinttype   = {arXiv},
  eprint       = {2002.08936}
}
% Preprint record; the AISTATS 2020 record with the same title is
% DBLP:conf/aistats/LiangSWY020.
@article{DBLP:journals/corr/abs-2002-09812,
  author       = {Yingyu Liang and
                  Zhao Song and
                  Mengdi Wang and
                  Lin F. Yang and
                  Xin Yang},
  title        = {Sketching Transformed Matrices with Applications to Natural Language
                  Processing},
  journal      = {CoRR},
  volume       = {abs/2002.09812},
  year         = {2020},
  eprinttype   = {arXiv},
  eprint       = {2002.09812}
}
@article{DBLP:journals/corr/abs-2003-01876,
  author       = {Yangsibo Huang and
                  Yushan Su and
                  Sachin Ravi and
                  Zhao Song and
                  Sanjeev Arora and
                  Kai Li},
  title        = {Privacy-preserving Learning via Deep Net Pruning},
  journal      = {CoRR},
  volume       = {abs/2003.01876},
  year         = {2020},
  eprinttype   = {arXiv},
  eprint       = {2003.01876}
}
% Preprint record; the STOC 2020 record by the same authors with a
% near-identical title is DBLP:conf/stoc/JiangLSW20.
@article{DBLP:journals/corr/abs-2004-04250,
  author       = {Haotian Jiang and
                  Yin Tat Lee and
                  Zhao Song and
                  Sam Chiu{-}wai Wong},
  title        = {An Improved Cutting Plane Method for Convex Optimization, Convex-Concave
                  Games and its Applications},
  journal      = {CoRR},
  volume       = {abs/2004.04250},
  year         = {2020},
  eprinttype   = {arXiv},
  eprint       = {2004.04250}
}
@article{DBLP:journals/corr/abs-2004-07470,
  author       = {Shunhua Jiang and
                  Zhao Song and
                  Omri Weinstein and
                  Hengjie Zhang},
  title        = {Faster Dynamic Matrix Inverse for Faster {LPs}},
  journal      = {CoRR},
  volume       = {abs/2004.07470},
  year         = {2020},
  eprinttype   = {arXiv},
  eprint       = {2004.07470}
}
@article{DBLP:journals/corr/abs-2004-07986,
  author       = {Zhao Song and
                  David P. Woodruff and
                  Peilin Zhong},
  title        = {Average Case Column Subset Selection for Entrywise {$\ell_1$}-Norm
                  Loss},
  journal      = {CoRR},
  volume       = {abs/2004.07986},
  year         = {2020},
  eprinttype   = {arXiv},
  eprint       = {2004.07986}
}
@article{DBLP:journals/corr/abs-2005-06156,
  author       = {Yaonan Jin and
                  Daogao Liu and
                  Zhao Song},
  title        = {A robust multi-dimensional sparse {Fourier} transform in the continuous
                  setting},
  journal      = {CoRR},
  volume       = {abs/2005.06156},
  year         = {2020},
  eprinttype   = {arXiv},
  eprint       = {2005.06156}
}
@article{DBLP:journals/corr/abs-2006-05975,
  author       = {Simon S. Du and
                  Wei Hu and
                  Zhiyuan Li and
                  Ruoqi Shen and
                  Zhao Song and
                  Jiajun Wu},
  title        = {When is Particle Filtering Efficient for {POMDP} Sequential Planning?},
  journal      = {CoRR},
  volume       = {abs/2006.05975},
  year         = {2020},
  eprinttype   = {arXiv},
  eprint       = {2006.05975}
}
@article{DBLP:journals/corr/abs-2006-11648,
  author       = {Jan van den Brand and
                  Binghui Peng and
                  Zhao Song and
                  Omri Weinstein},
  title        = {Training (Overparametrized) Neural Networks in Near-Linear Time},
  journal      = {CoRR},
  volume       = {abs/2006.11648},
  year         = {2020}
}
@article{DBLP:journals/corr/abs-2008-09593,
  author       = {Zhao Song and
                  Ruizhe Zhang},
  title        = {Hyperbolic Polynomials {I} : Concentration and Discrepancy},
  journal      = {CoRR},
  volume       = {abs/2008.09593},
  year         = {2020}
}
@article{DBLP:journals/corr/abs-2009-01802,
  author       = {Jan van den Brand and
                  Yin Tat Lee and
                  Danupon Nanongkai and
                  Richard Peng and
                  Thatchaphol Saranurak and
                  Aaron Sidford and
                  Zhao Song and
                  Di Wang},
  title        = {Bipartite Matching in Nearly-linear Time on Moderately Dense Graphs},
  journal      = {CoRR},
  volume       = {abs/2009.01802},
  year         = {2020}
}
@article{DBLP:journals/corr/abs-2009-06106,
  author       = {S. Cliff Liu and
                  Zhao Song and
                  Hengjie Zhang and
                  Lichen Zhang and
                  Tianyi Zhou},
  title        = {Space-Efficient Interior Point Method, with applications to Linear
                  Programming and Maximum Weight Bipartite Matching},
  journal      = {CoRR},
  volume       = {abs/2009.06106},
  year         = {2020}
}
@article{DBLP:journals/corr/abs-2009-07268,
  author       = {Andr{\'{a}}s Gily{\'{e}}n and
                  Zhao Song and
                  Ewin Tang},
  title        = {An improved quantum-inspired algorithm for linear regression},
  journal      = {CoRR},
  volume       = {abs/2009.07268},
  year         = {2020}
}
@article{DBLP:journals/corr/abs-2009-09829,
  author       = {Jason D. Lee and
                  Ruoqi Shen and
                  Zhao Song and
                  Mengdi Wang and
                  Zheng Yu},
  title        = {Generalized Leverage Score Sampling for Neural Networks},
  journal      = {CoRR},
  volume       = {abs/2009.09829},
  year         = {2020}
}
@article{DBLP:journals/corr/abs-2009-10217,
  author       = {Haotian Jiang and
                  Tarun Kathuria and
                  Yin Tat Lee and
                  Swati Padmanabhan and
                  Zhao Song},
  title        = {A Faster Interior Point Method for Semidefinite Programming},
  journal      = {CoRR},
  volume       = {abs/2009.10217},
  year         = {2020}
}
@article{DBLP:journals/corr/abs-2010-02772,
  author       = {Yangsibo Huang and
                  Zhao Song and
                  Kai Li and
                  Sanjeev Arora},
  title        = {{InstaHide}: Instance-hiding Schemes for Private Distributed Learning},
  journal      = {CoRR},
  volume       = {abs/2010.02772},
  year         = {2020}
}
@article{DBLP:journals/corr/abs-2010-06053,
  author       = {Yangsibo Huang and
                  Zhao Song and
                  Danqi Chen and
                  Kai Li and
                  Sanjeev Arora},
  title        = {{TextHide}: Tackling Data Privacy in Language Understanding Tasks},
  journal      = {CoRR},
  volume       = {abs/2010.06053},
  year         = {2020}
}
@article{DBLP:journals/corr/abs-2010-11463,
  author       = {Xiaoxiao Li and
                  Yangsibo Huang and
                  Binghui Peng and
                  Zhao Song and
                  Kai Li},
  title        = {{MixCon}: Adjusting the Separability of Data Representations for Harder
                  Data Recovery},
  journal      = {CoRR},
  volume       = {abs/2010.11463},
  year         = {2020}
}
@article{DBLP:journals/corr/abs-2011-02466,
  author       = {Josh Alman and
                  Timothy Chu and
                  Aaron Schild and
                  Zhao Song},
  title        = {Algorithms and Hardness for Linear Algebra on Geometric Graphs},
  journal      = {CoRR},
  volume       = {abs/2011.02466},
  year         = {2020}
}
@article{DBLP:journals/corr/abs-2011-11181,
  author       = {Sitan Chen and
                  Zhao Song and
                  Danyang Zhuo},
  title        = {On {InstaHide}, Phase Retrieval, and Sparse Matrix Factorization},
  journal      = {CoRR},
  volume       = {abs/2011.11181},
  year         = {2020}
}
@article{DBLP:journals/corr/abs-2011-11877,
  author       = {Baihe Huang and
                  Zhao Song and
                  Runzhou Tao and
                  Ruizhe Zhang and
                  Danyang Zhuo},
  title        = {{InstaHide}'s Sample Complexity When Mixing Two Private Images},
  journal      = {CoRR},
  volume       = {abs/2011.11877},
  year         = {2020}
}
@article{DBLP:journals/jmlr/BalcanLSW019,
  author       = {Maria{-}Florina Balcan and
                  Yingyu Liang and
                  Zhao Song and
                  David P. Woodruff and
                  Hongyang Zhang},
  title        = {Non-Convex Matrix Completion and Related Problems via Strong Duality},
  journal      = {J. Mach. Learn. Res.},
  volume       = {20},
  pages        = {102:1--102:56},
  year         = {2019}
}
@inproceedings{DBLP:conf/aistats/LinSY19,
  author       = {Yibo Lin and
                  Zhao Song and
                  Lin F. Yang},
  title        = {Towards a Theoretical Understanding of Hashing-Based Neural Nets},
  booktitle    = {{AISTATS}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {89},
  pages        = {127--137},
  publisher    = {{PMLR}},
  year         = {2019}
}
@inproceedings{DBLP:conf/colt/LeeSZ19,
  author       = {Yin Tat Lee and
                  Zhao Song and
                  Qiuyi Zhang},
  title        = {Solving Empirical Risk Minimization in the Current Matrix Multiplication
                  Time},
  booktitle    = {{COLT}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {99},
  pages        = {2140--2157},
  publisher    = {{PMLR}},
  year         = {2019}
}
@inproceedings{DBLP:conf/focs/RubinsteinSSS19,
  author       = {Aviad Rubinstein and
                  Saeed Seddighin and
                  Zhao Song and
                  Xiaorui Sun},
  title        = {Approximation Algorithms for {LCS} and {LIS} with Truly Improved Running
                  Times},
  booktitle    = {{FOCS}},
  pages        = {1121--1145},
  publisher    = {{IEEE} Computer Society},
  year         = {2019}
}
@inproceedings{DBLP:conf/focs/NakosSW19,
  author       = {Vasileios Nakos and
                  Zhao Song and
                  Zhengyu Wang},
  title        = {(Nearly) Sample-Optimal Sparse Fourier Transform in Any Dimension;
                  {RIPless} and Filterless},
  booktitle    = {{FOCS}},
  pages        = {1568--1577},
  publisher    = {{IEEE} Computer Society},
  year         = {2019}
}
@inproceedings{DBLP:conf/iclr/ZhangCSBDH19,
  author       = {Huan Zhang and
                  Hongge Chen and
                  Zhao Song and
                  Duane S. Boning and
                  Inderjit S. Dhillon and
                  Cho{-}Jui Hsieh},
  title        = {The Limitations of Adversarial Training and the Blind-Spot Attack},
  booktitle    = {{ICLR} (Poster)},
  publisher    = {OpenReview.net},
  year         = {2019}
}
@inproceedings{DBLP:conf/icml/Allen-ZhuLS19,
  author       = {Zeyuan Allen{-}Zhu and
                  Yuanzhi Li and
                  Zhao Song},
  title        = {A Convergence Theory for Deep Learning via Over-Parameterization},
  booktitle    = {{ICML}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {97},
  pages        = {242--252},
  publisher    = {{PMLR}},
  year         = {2019}
}
@inproceedings{DBLP:conf/nips/SongWYZZ19,
  author       = {Zhao Song and
                  Ruosong Wang and
                  Lin F. Yang and
                  Hongyang Zhang and
                  Peilin Zhong},
  title        = {Efficient Symmetric Norm Regression via Linear Sketching},
  booktitle    = {NeurIPS},
  pages        = {828--838},
  year         = {2019}
}
@inproceedings{DBLP:conf/nips/DiaoSWY19,
  author       = {Huaian Diao and
                  Zhao Song and
                  David P. Woodruff and
                  Xin Yang},
  title        = {Total Least Squares Regression in Input Sparsity Time},
  booktitle    = {NeurIPS},
  pages        = {2478--2489},
  year         = {2019}
}
@inproceedings{DBLP:conf/nips/DiaoJSSW19,
  author       = {Huaian Diao and
                  Rajesh Jayaram and
                  Zhao Song and
                  Wen Sun and
                  David P. Woodruff},
  title        = {Optimal Sketching for Kronecker Product Regression and Low Rank Approximation},
  booktitle    = {NeurIPS},
  pages        = {4739--4750},
  year         = {2019}
}
@inproceedings{DBLP:conf/nips/SongWZ19,
  author       = {Zhao Song and
                  David P. Woodruff and
                  Peilin Zhong},
  title        = {Towards a Zero-One Law for Column Subset Selection},
  booktitle    = {NeurIPS},
  pages        = {6120--6131},
  year         = {2019}
}
@inproceedings{DBLP:conf/nips/Allen-ZhuLS19,
  author       = {Zeyuan Allen{-}Zhu and
                  Yuanzhi Li and
                  Zhao Song},
  title        = {On the Convergence Rate of Training Recurrent Neural Networks},
  booktitle    = {NeurIPS},
  pages        = {6673--6685},
  year         = {2019}
}
@inproceedings{DBLP:conf/nips/SongWZ19a,
  author       = {Zhao Song and
                  David P. Woodruff and
                  Peilin Zhong},
  title        = {Average Case Column Subset Selection for Entrywise {\(\ell_{1}\)}-Norm
                  Loss},
  booktitle    = {NeurIPS},
  pages        = {10111--10121},
  year         = {2019}
}
@inproceedings{DBLP:conf/nips/ZhongS0D19,
  author       = {Kai Zhong and
                  Zhao Song and
                  Prateek Jain and
                  Inderjit S. Dhillon},
  title        = {Provable Non-linear Inductive Matrix Completion},
  booktitle    = {NeurIPS},
  pages        = {11435--11445},
  year         = {2019}
}
@inproceedings{DBLP:conf/soda/SongWZ19,
  author       = {Zhao Song and
                  David P. Woodruff and
                  Peilin Zhong},
  title        = {Relative Error Tensor Low Rank Approximation},
  booktitle    = {{SODA}},
  pages        = {2772--2789},
  publisher    = {{SIAM}},
  year         = {2019}
}
@inproceedings{DBLP:conf/stoc/NakosS19,
  author       = {Vasileios Nakos and
                  Zhao Song},
  title        = {Stronger l\({}_{\mbox{2}}\)/l\({}_{\mbox{2}}\) compressed sensing;
                  without iterating},
  booktitle    = {{STOC}},
  pages        = {289--297},
  publisher    = {{ACM}},
  year         = {2019}
}
@inproceedings{DBLP:conf/stoc/CohenLS19,
  author       = {Michael B. Cohen and
                  Yin Tat Lee and
                  Zhao Song},
  title        = {Solving linear programs in the current matrix multiplication time},
  booktitle    = {{STOC}},
  pages        = {938--942},
  publisher    = {{ACM}},
  year         = {2019}
}
@article{DBLP:journals/corr/abs-1901-04684,
  author       = {Huan Zhang and
                  Hongge Chen and
                  Zhao Song and
                  Duane S. Boning and
                  Inderjit S. Dhillon and
                  Cho{-}Jui Hsieh},
  title        = {The Limitations of Adversarial Training and the Blind-Spot Attack},
  journal      = {CoRR},
  volume       = {abs/1901.04684},
  year         = {2019}
}
@article{DBLP:journals/corr/abs-1901-06731,
  author       = {Rasmus Kyng and
                  Kyle Luh and
                  Zhao Song},
  title        = {Four Deviations Suffice for Rank 1 Matrices},
  journal      = {CoRR},
  volume       = {abs/1901.06731},
  year         = {2019}
}
@article{DBLP:journals/corr/abs-1903-02742,
  author       = {Vasileios Nakos and
                  Zhao Song},
  title        = {Stronger {L2/L2} Compressed Sensing; Without Iterating},
  journal      = {CoRR},
  volume       = {abs/1903.02742},
  year         = {2019}
}
@article{DBLP:journals/corr/abs-1904-05451,
  author       = {Aviad Rubinstein and
                  Zhao Song},
  title        = {Reducing approximate Longest Common Subsequence to approximate Edit
                  Distance},
  journal      = {CoRR},
  volume       = {abs/1904.05451},
  year         = {2019}
}
@article{DBLP:journals/corr/abs-1905-00475,
  author       = {Zhao Song and
                  Wen Sun},
  title        = {Efficient Model-free Reinforcement Learning in Metric Spaces},
  journal      = {CoRR},
  volume       = {abs/1905.00475},
  year         = {2019}
}
@article{DBLP:journals/corr/abs-1905-04447,
  author       = {Yin Tat Lee and
                  Zhao Song and
                  Qiuyi Zhang},
  title        = {Solving Empirical Risk Minimization in the Current Matrix Multiplication
                  Time},
  journal      = {CoRR},
  volume       = {abs/1905.04447},
  year         = {2019}
}
@article{DBLP:journals/corr/abs-1906-03593,
  author       = {Zhao Song and
                  Xin Yang},
  title        = {Quadratic Suffices for Over-parametrization via Matrix Chernoff Bound},
  journal      = {CoRR},
  volume       = {abs/1906.03593},
  year         = {2019}
}
@article{DBLP:journals/corr/abs-1909-11123,
  author       = {Vasileios Nakos and
                  Zhao Song and
                  Zhengyu Wang},
  title        = {(Nearly) Sample-Optimal Sparse Fourier Transform in Any Dimension;
                  {RIPless} and Filterless},
  journal      = {CoRR},
  volume       = {abs/1909.11123},
  year         = {2019}
}
@article{DBLP:journals/corr/abs-1909-12441,
  author       = {Huaian Diao and
                  Zhao Song and
                  David P. Woodruff and
                  Xin Yang},
  title        = {Total Least Squares Regression in Input Sparsity Time},
  journal      = {CoRR},
  volume       = {abs/1909.12441},
  year         = {2019}
}
@article{DBLP:journals/corr/abs-1909-13384,
  author       = {Huaian Diao and
                  Rajesh Jayaram and
                  Zhao Song and
                  Wen Sun and
                  David P. Woodruff},
  title        = {Optimal Sketching for Kronecker Product Regression and Low Rank Approximation},
  journal      = {CoRR},
  volume       = {abs/1909.13384},
  year         = {2019}
}
@article{DBLP:journals/corr/abs-1910-01788,
  author       = {Zhao Song and
                  Ruosong Wang and
                  Lin F. Yang and
                  Hongyang Zhang and
                  Peilin Zhong},
  title        = {Efficient Symmetric Norm Regression via Linear Sketching},
  journal      = {CoRR},
  volume       = {abs/1910.01788},
  year         = {2019}
}
@article{DBLP:journals/corr/abs-1912-07629,
  author       = {Sitan Chen and
                  Jerry Li and
                  Zhao Song},
  title        = {Learning Mixtures of Linear Regressions in Subexponential Time via
                  Fourier Moments},
  journal      = {CoRR},
  volume       = {abs/1912.07629},
  year         = {2019}
}
@article{DBLP:journals/tcs/BeregB0KMS18,
  author       = {Sergey Bereg and
                  Binay Bhattacharya and
                  Sandip Das and
                  Tsunehiko Kameda and
                  Priya Ranjan Sinha Mahapatra and
                  Zhao Song},
  title        = {Optimizing squares covering a set of points},
  journal      = {Theor. Comput. Sci.},
  volume       = {729},
  pages        = {68--83},
  year         = {2018}
}
@inproceedings{DBLP:conf/aistats/LiauSPY18,
  author       = {David Liau and
                  Zhao Song and
                  Eric Price and
                  Ger Yang},
  title        = {Stochastic Multi-armed Bandits in Constant Space},
  booktitle    = {{AISTATS}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {84},
  pages        = {386--394},
  publisher    = {{PMLR}},
  year         = {2018}
}
@inproceedings{DBLP:conf/aistats/DiaoSSW18,
  author       = {Huaian Diao and
                  Zhao Song and
                  Wen Sun and
                  David P. Woodruff},
  title        = {Sketching for Kronecker Product Regression and P-splines},
  booktitle    = {{AISTATS}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {84},
  pages        = {1299--1308},
  publisher    = {{PMLR}},
  year         = {2018}
}
@inproceedings{DBLP:conf/focs/KyngS18,
  author       = {Rasmus Kyng and
                  Zhao Song},
  title        = {A Matrix Chernoff Bound for Strongly Rayleigh Distributions and Spectral
                  Sparsifiers from a few Random Spanning Trees},
  booktitle    = {{FOCS}},
  pages        = {373--384},
  publisher    = {{IEEE} Computer Society},
  year         = {2018}
}
@inproceedings{DBLP:conf/focs/AndoniSSWZ18,
  author       = {Alexandr Andoni and
                  Zhao Song and
                  Clifford Stein and
                  Zhengyu Wang and
                  Peilin Zhong},
  title        = {Parallel Graph Connectivity in Log Diameter Rounds},
  booktitle    = {{FOCS}},
  pages        = {674--685},
  publisher    = {{IEEE} Computer Society},
  year         = {2018}
}
@inproceedings{DBLP:conf/icml/WengZCSHDBD18,
  author       = {Tsui{-}Wei Weng and
                  Huan Zhang and
                  Hongge Chen and
                  Zhao Song and
                  Cho{-}Jui Hsieh and
                  Luca Daniel and
                  Duane S. Boning and
                  Inderjit S. Dhillon},
  title        = {Towards Fast Computation of Certified Robustness for {ReLU} Networks},
  booktitle    = {{ICML}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {80},
  pages        = {5273--5282},
  publisher    = {{PMLR}},
  year         = {2018}
}
@inproceedings{DBLP:conf/icml/ZhangLSD18,
  author       = {Jiong Zhang and
                  Yibo Lin and
                  Zhao Song and
                  Inderjit S. Dhillon},
  title        = {Learning Long Term Dependencies via Fourier Recurrent Units},
  booktitle    = {{ICML}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {80},
  pages        = {5810--5818},
  publisher    = {{PMLR}},
  year         = {2018}
}
@inproceedings{DBLP:conf/stoc/GargLSS18,
  author       = {Ankit Garg and
                  Yin Tat Lee and
                  Zhao Song and
                  Nikhil Srivastava},
  title        = {A matrix expander Chernoff bound},
  booktitle    = {{STOC}},
  pages        = {1102--1114},
  publisher    = {{ACM}},
  year         = {2018}
}
@incollection{DBLP:reference/snam/HuSE18,
  author       = {Bo Hu and
                  Zhao Song and
                  Martin Ester},
  title        = {Topic Modeling in Online Social Media, User Features and Social Networks
                  for},
  booktitle    = {Encyclopedia of Social Network Analysis and Mining. 2nd Ed},
  publisher    = {Springer},
  year         = {2018}
}
@article{DBLP:journals/corr/abs-1802-00459,
  author       = {Zhao Song and
                  Lin F. Yang and
                  Peilin Zhong},
  title        = {Sensitivity Sampling Over Dynamic Geometric Data Streams with Applications
                  to k-Clustering},
  journal      = {CoRR},
  volume       = {abs/1802.00459},
  year         = {2018}
}
@article{DBLP:journals/corr/abs-1803-06585,
  author       = {Jiong Zhang and
                  Yibo Lin and
                  Zhao Song and
                  Inderjit S. Dhillon},
  title        = {Learning Long Term Dependencies via Fourier Recurrent Units},
  journal      = {CoRR},
  volume       = {abs/1803.06585},
  year         = {2018}
}
@article{DBLP:journals/corr/abs-1804-09699,
  author       = {Tsui{-}Wei Weng and
                  Huan Zhang and
                  Hongge Chen and
                  Zhao Song and
                  Cho{-}Jui Hsieh and
                  Duane S. Boning and
                  Inderjit S. Dhillon and
                  Luca Daniel},
  title        = {Towards Fast Computation of Certified Robustness for {ReLU} Networks},
  journal      = {CoRR},
  volume       = {abs/1804.09699},
  year         = {2018}
}
@article{DBLP:journals/corr/abs-1805-03055,
  author       = {Alexandr Andoni and
                  Clifford Stein and
                  Zhao Song and
                  Zhengyu Wang and
                  Peilin Zhong},
  title        = {Parallel Graph Connectivity in Log Diameter Rounds},
  journal      = {CoRR},
  volume       = {abs/1805.03055},
  year         = {2018}
}
@article{DBLP:journals/corr/abs-1805-10477,
  author       = {Kai Zhong and
                  Zhao Song and
                  Prateek Jain and
                  Inderjit S. Dhillon},
  title        = {Nonlinear Inductive Matrix Completion based on One-layer Neural Networks},
  journal      = {CoRR},
  volume       = {abs/1805.10477},
  year         = {2018}
}
@article{DBLP:journals/corr/abs-1810-07896,
  author       = {Michael B. Cohen and
                  Yin Tat Lee and
                  Zhao Song},
  title        = {Solving Linear Programs in the Current Matrix Multiplication Time},
  journal      = {CoRR},
  volume       = {abs/1810.07896},
  year         = {2018}
}
@article{DBLP:journals/corr/abs-1810-08345,
  author       = {Rasmus Kyng and
                  Zhao Song},
  title        = {A Matrix Chernoff Bound for Strongly Rayleigh Distributions and Spectral
                  Sparsifiers from a few Random Spanning Trees},
  journal      = {CoRR},
  volume       = {abs/1810.08345},
  year         = {2018}
}
@article{DBLP:journals/corr/abs-1810-12065,
  author       = {Zeyuan Allen{-}Zhu and
                  Yuanzhi Li and
                  Zhao Song},
  title        = {On the Convergence Rate of Training Recurrent Neural Networks},
  journal      = {CoRR},
  volume       = {abs/1810.12065},
  year         = {2018}
}
@article{DBLP:journals/corr/abs-1811-01442,
  author       = {Zhao Song and
                  David P. Woodruff and
                  Peilin Zhong},
  title        = {Towards a Zero-One Law for Entrywise Low Rank Approximation},
  journal      = {CoRR},
  volume       = {abs/1811.01442},
  year         = {2018}
}
@article{DBLP:journals/corr/abs-1811-03962,
  author       = {Zeyuan Allen{-}Zhu and
                  Yuanzhi Li and
                  Zhao Song},
  title        = {A Convergence Theory for Deep Learning via Over-Parameterization},
  journal      = {CoRR},
  volume       = {abs/1811.03962},
  year         = {2018}
}
@article{DBLP:journals/corr/abs-1812-06243,
  author       = {Yin Tat Lee and
                  Zhao Song and
                  Santosh S. Vempala},
  title        = {Algorithmic Theory of {ODEs} and Sampling from Well-conditioned Logconcave
                  Densities},
  journal      = {CoRR},
  volume       = {abs/1812.06243},
  year         = {2018}
}
@article{DBLP:journals/corr/abs-1812-10244,
  author       = {Yibo Lin and
                  Zhao Song and
                  Lin F. Yang},
  title        = {Towards a Theoretical Understanding of Hashing-Based Neural Nets},
  journal      = {CoRR},
  volume       = {abs/1812.10244},
  year         = {2018}
}
@article{DBLP:journals/eccc/SongWZ18,
  author       = {Zhao Song and
                  David P. Woodruff and
                  Peilin Zhong},
  title        = {Relative Error Tensor Low Rank Approximation},
  journal      = {Electron. Colloquium Comput. Complex.},
  volume       = {{TR18-103}},
  year         = {2018}
}
@inproceedings{DBLP:conf/icalp/PriceSW17,
  author       = {Eric Price and
                  Zhao Song and
                  David P. Woodruff},
  title        = {Fast Regression with an {\(\ell_{\infty}\)} Guarantee},
  booktitle    = {{ICALP}},
  series       = {LIPIcs},
  volume       = {80},
  pages        = {59:1--59:14},
  publisher    = {Schloss Dagstuhl - Leibniz-Zentrum f{\"{u}}r Informatik},
  year         = {2017}
}
@inproceedings{DBLP:conf/icml/ZhongS0BD17,
  author       = {Kai Zhong and
                  Zhao Song and
                  Prateek Jain and
                  Peter L. Bartlett and
                  Inderjit S. Dhillon},
  title        = {Recovery Guarantees for One-hidden-layer Neural Networks},
  booktitle    = {{ICML}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {70},
  pages        = {4140--4149},
  publisher    = {{PMLR}},
  year         = {2017}
}
@inproceedings{DBLP:conf/stoc/SongWZ17,
  author       = {Zhao Song and
                  David P. Woodruff and
                  Peilin Zhong},
  title        = {Low rank approximation with entrywise l\({}_{\mbox{1}}\)-norm error},
  booktitle    = {{STOC}},
  pages        = {688--701},
  publisher    = {{ACM}},
  year         = {2017}
}
@article{DBLP:journals/corr/SongWZ17,
  author       = {Zhao Song and
                  David P. Woodruff and
                  Peilin Zhong},
  title        = {Relative Error Tensor Low Rank Approximation},
  journal      = {CoRR},
  volume       = {abs/1704.08246},
  year         = {2017}
}
@article{DBLP:journals/corr/PriceSW17,
  author       = {Eric Price and
                  Zhao Song and
                  David P. Woodruff},
  title        = {Fast Regression with an {\(\ell_{\infty}\)}
                  Guarantee},
  journal      = {CoRR},
  volume       = {abs/1705.10723},
  year         = {2017}
}
@article{DBLP:journals/corr/ZhongS0BD17,
  author       = {Kai Zhong and
                  Zhao Song and
                  Prateek Jain and
                  Peter L. Bartlett and
                  Inderjit S. Dhillon},
  title        = {Recovery Guarantees for One-hidden-layer Neural Networks},
  journal      = {CoRR},
  volume       = {abs/1706.03175},
  year         = {2017}
}
@article{DBLP:journals/corr/abs-1711-03440,
  author       = {Kai Zhong and
                  Zhao Song and
                  Inderjit S. Dhillon},
  title        = {Learning Non-overlapping Convolutional Neural Networks with Multiple
                  Kernels},
  journal      = {CoRR},
  volume       = {abs/1711.03440},
  year         = {2017}
}
@article{DBLP:journals/corr/abs-1712-09007,
  author       = {David Liau and
                  Eric Price and
                  Zhao Song and
                  Ger Yang},
  title        = {Stochastic Multi-armed Bandits in Constant Space},
  journal      = {CoRR},
  volume       = {abs/1712.09007},
  year         = {2017}
}
@article{DBLP:journals/corr/abs-1712-09473,
  author       = {Huaian Diao and
                  Zhao Song and
                  Wen Sun and
                  David P. Woodruff},
  title        = {Sketching for Kronecker Product Regression and P-splines},
  journal      = {CoRR},
  volume       = {abs/1712.09473},
  year         = {2017}
}
@article{DBLP:journals/tit/RawatSDG16,
  author       = {Ankit Singh Rawat and
                  Zhao Song and
                  Alexandros G. Dimakis and
                  Anna G{\'{a}}l},
  title        = {Batch Codes Through Dense Graphs Without Short Cycles},
  journal      = {{IEEE} Trans. Inf. Theory},
  volume       = {62},
  number       = {4},
  pages        = {1592--1604},
  year         = {2016}
}
@inproceedings{DBLP:conf/focs/ChenKPS16,
  author       = {Xue Chen and
                  Daniel M. Kane and
                  Eric Price and
                  Zhao Song},
  title        = {Fourier-Sparse Interpolation without a Frequency Gap},
  booktitle    = {{FOCS}},
  pages        = {741--750},
  publisher    = {{IEEE} Computer Society},
  year         = {2016}
}
@inproceedings{DBLP:conf/ijcai/ZhangS16,
  author       = {Ruohan Zhang and
                  Zhao Song},
  title        = {Maximum Sustainable Yield Problem for Robot Foraging and Construction
                  System},
  booktitle    = {{IJCAI}},
  pages        = {2725--2731},
  publisher    = {{IJCAI/AAAI} Press},
  year         = {2016}
}
@inproceedings{DBLP:conf/nips/SongWZ16,
  author       = {Zhao Song and
                  David P. Woodruff and
                  Huan Zhang},
  title        = {Sublinear Time Orthogonal Tensor Decomposition},
  booktitle    = {{NIPS}},
  pages        = {793--801},
  year         = {2016}
}
@inproceedings{DBLP:conf/stoc/RazenshteynSW16,
  author       = {Ilya P. Razenshteyn and
                  Zhao Song and
                  David P. Woodruff},
  title        = {Weighted low rank approximations with provable guarantees},
  booktitle    = {{STOC}},
  pages        = {250--263},
  publisher    = {{ACM}},
  year         = {2016}
}
@inproceedings{DBLP:conf/swat/BanikBDKS16,
  author       = {Aritra Banik and
                  Binay K. Bhattacharya and
                  Sandip Das and
                  Tsunehiko Kameda and
                  Zhao Song},
  title        = {The p-Center Problem in Tree Networks Revisited},
  booktitle    = {{SWAT}},
  series       = {LIPIcs},
  volume       = {53},
  pages        = {6:1--6:15},
  publisher    = {Schloss Dagstuhl - Leibniz-Zentrum f{\"{u}}r Informatik},
  year         = {2016}
}
@article{DBLP:journals/corr/BanikBDKS16,
  author       = {Aritra Banik and
                  Binay K. Bhattacharya and
                  Sandip Das and
                  Tsunehiko Kameda and
                  Zhao Song},
  title        = {The {\(p\)}-Center Problem in Tree Networks Revisited},
  journal      = {CoRR},
  volume       = {abs/1604.07535},
  year         = {2016}
}
@article{DBLP:journals/corr/PriceS16,
  author       = {Eric Price and
                  Zhao Song},
  title        = {A Robust Sparse Fourier Transform in the Continuous Setting},
  journal      = {CoRR},
  volume       = {abs/1609.00896},
  year         = {2016}
}
@article{DBLP:journals/corr/ChenKPS16,
  author       = {Xue Chen and
                  Daniel M. Kane and
                  Eric Price and
                  Zhao Song},
  title        = {Fourier-sparse interpolation without a frequency gap},
  journal      = {CoRR},
  volume       = {abs/1609.01361},
  year         = {2016}
}
@article{DBLP:journals/corr/SongWZ16,
  author       = {Zhao Song and
                  David P. Woodruff and
                  Peilin Zhong},
  title        = {Low Rank Approximation with Entrywise {\(\ell_{1}\)}-Norm
                  Error},
  journal      = {CoRR},
  volume       = {abs/1611.00898},
  year         = {2016}
}
@article{DBLP:journals/dam/BhattacharyaKS15,
  author       = {Binay Bhattacharya and
                  Tsunehiko Kameda and
                  Zhao Song},
  title        = {Minmax regret 1-center algorithms for path/tree/unicycle/cactus networks},
  journal      = {Discret. Appl. Math.},
  volume       = {195},
  pages        = {18--30},
  year         = {2015}
}
@inproceedings{DBLP:conf/aaai/ZhangSB15,
  author       = {Ruohan Zhang and
                  Zhao Song and
                  Dana H. Ballard},
  title        = {Global Policy Construction in Modular Reinforcement Learning},
  booktitle    = {{AAAI}},
  pages        = {4226--4227},
  publisher    = {{AAAI} Press},
  year         = {2015}
}
@inproceedings{DBLP:conf/dac/WangLYSOC15,
  author       = {Ye Wang and
                  Meng Li and
                  Xinyang Yi and
                  Zhao Song and
                  Michael Orshansky and
                  Constantine Caramanis},
  title        = {Novel power grid reduction method based on {L1} regularization},
  booktitle    = {{DAC}},
  pages        = {93:1--93:6},
  publisher    = {{ACM}},
  year         = {2015}
}
% FOCS 2015 conference paper. "Fourier" is a proper noun in the middle of the
% title, so it is brace-protected to keep its capital under styles that
% convert titles to sentence case.
@inproceedings{DBLP:conf/focs/PriceS15,
  author       = {Eric Price and
                  Zhao Song},
  title        = {A Robust Sparse {Fourier} Transform in the Continuous Setting},
  booktitle    = {{FOCS}},
  pages        = {583--600},
  publisher    = {{IEEE} Computer Society},
  year         = {2015}
}
% ISIT 2015 conference paper, pages 1477--1481.
@inproceedings{DBLP:conf/isit/RawatSDG15,
  author    = {Rawat, Ankit Singh and Song, Zhao and
               Dimakis, Alexandros G. and G{\'{a}}l, Anna},
  title     = {Batch codes through dense graphs without short cycles},
  booktitle = {{ISIT}},
  publisher = {{IEEE}},
  year      = {2015},
  pages     = {1477--1481},
}
% Algorithmica journal article, volume 70, issue 1 (2014).
@article{DBLP:journals/algorithmica/BhattacharyaKS14,
  author  = {Bhattacharya, Binay K. and Kameda, Tsunehiko and Song, Zhao},
  title   = {A Linear Time Algorithm for Computing Minmax Regret 1-Median on a Tree Network},
  journal = {Algorithmica},
  year    = {2014},
  volume  = {70},
  number  = {1},
  pages   = {2--21},
}
% AAMAS 2014 conference paper, pages 1343--1344.
@inproceedings{DBLP:conf/atal/SongS14,
  author    = {Song, Zhao and Sun, Wen},
  title     = {Probabilistic recharging model in uncertain environments},
  booktitle = {{AAMAS}},
  publisher = {{IFAAMAS/ACM}},
  year      = {2014},
  pages     = {1343--1344},
}
% COCOA 2014 conference paper, published in LNCS volume 8881.
@inproceedings{DBLP:conf/cocoa/BhattacharyaDKMS14,
  author    = {Bhattacharya, Binay K. and Das, Sandip and Kameda, Tsunehiko and
               Mahapatra, Priya Ranjan Sinha and Song, Zhao},
  title     = {Optimizing Squares Covering a Set of Points},
  booktitle = {{COCOA}},
  series    = {Lecture Notes in Computer Science},
  volume    = {8881},
  publisher = {Springer},
  year      = {2014},
  pages     = {37--52},
}
% COCOON 2014 conference paper, published in LNCS volume 8591.
@inproceedings{DBLP:conf/cocoon/BhattacharyaDKRSS14,
  author    = {Bhattacharya, Binay K. and De, Minati and Kameda, Tsunehiko and
               Roy, Sasanka and Sokol, Vladyslav and Song, Zhao},
  title     = {Back-Up 2-Center on a Path/Tree/Cycle/Unicycle},
  booktitle = {{COCOON}},
  series    = {Lecture Notes in Computer Science},
  volume    = {8591},
  publisher = {Springer},
  year      = {2014},
  pages     = {417--428},
}
% LATIN 2014 conference paper, published in LNCS volume 8392.
@inproceedings{DBLP:conf/latin/BhattacharyaKS14,
  author    = {Bhattacharya, Binay K. and Kameda, Tsunehiko and Song, Zhao},
  title     = {Improved Minmax Regret 1-Center Algorithms for Cactus Networks with c Cycles},
  booktitle = {{LATIN}},
  series    = {Lecture Notes in Computer Science},
  volume    = {8392},
  publisher = {Springer},
  year      = {2014},
  pages     = {330--341},
}
% Encyclopedia chapter. A publisher is supplied because classic BibTeX styles
% require that field for incollection entries and warn when it is missing.
% NOTE(review): the title reads like an inverted, index-style heading (compare
% the ASONAM 2012 paper by the same authors in this file); confirm against the
% publisher record before rewording it.
@incollection{DBLP:reference/snam/HuSE14,
  author       = {Bo Hu and
                  Zhao Song and
                  Martin Ester},
  title        = {Topic Modeling in Online Social Media, User Features, and Social Networks
                  for},
  booktitle    = {Encyclopedia of Social Network Analysis and Mining},
  pages        = {2178--2191},
  publisher    = {Springer},
  year         = {2014}
}
% arXiv preprint. The arXiv identifier is additionally exposed through the
% eprint/eprinttype fields so eprint-aware styles can print and link it; the
% journal/volume pair is kept unchanged for styles that only read those fields.
@article{DBLP:journals/corr/DimakisGRS14,
  author       = {Alexandros G. Dimakis and
                  Anna G{\'{a}}l and
                  Ankit Singh Rawat and
                  Zhao Song},
  title        = {Batch Codes through Dense Graphs without Short Cycles},
  journal      = {CoRR},
  volume       = {abs/1410.2920},
  eprint       = {1410.2920},
  eprinttype   = {arXiv},
  year         = {2014}
}
% ECCC report TR14-127. The venue is stored under its full name so that any
% abbreviation is applied by the bibliography style, and so the periods of a
% hand-abbreviated name cannot be typeset as sentence ends.
@article{DBLP:journals/eccc/DimakisGRS14,
  author       = {Alexandros G. Dimakis and
                  Anna G{\'{a}}l and
                  Ankit Singh Rawat and
                  Zhao Song},
  title        = {Batch Codes through Dense Graphs without Short Cycles},
  journal      = {Electronic Colloquium on Computational Complexity},
  volume       = {{TR14-127}},
  year         = {2014}
}
% AAAI 2013 conference paper, pages 1641--1642.
@inproceedings{DBLP:conf/aaai/SongZ13,
  author    = {Song, Zhao and Zhu, Yuke},
  title     = {Graphical Model-Based Learning in High Dimensional Feature Spaces},
  booktitle = {{AAAI}},
  publisher = {{AAAI} Press},
  year      = {2013},
  pages     = {1641--1642},
}
% IROS 2013 conference paper, pages 3309--3316.
@inproceedings{DBLP:conf/iros/SongV13,
  author    = {Song, Zhao and Vaughan, Richard T.},
  title     = {Sustainable robot foraging: Adaptive fine-grained multi-robot
               task allocation for maximum sustainable yield of biological
               resources},
  booktitle = {{IROS}},
  publisher = {{IEEE}},
  year      = {2013},
  pages     = {3309--3316},
}
% AAMAS 2012 conference paper, pages 1199--1200.
@inproceedings{DBLP:conf/aamas/SongSV12,
  author    = {Song, Zhao and Sadat, Seyed Abbas and Vaughan, Richard T.},
  title     = {{MO-LOST:} adaptive ant trail untangling in multi-objective
               multi-colony robot foraging},
  booktitle = {{AAMAS}},
  publisher = {{IFAAMAS}},
  year      = {2012},
  pages     = {1199--1200},
}
% ASONAM 2012 conference paper, pages 202--209.
@inproceedings{DBLP:conf/asunam/HuSE12,
  author    = {Hu, Bo and Song, Zhao and Ester, Martin},
  title     = {User Features and Social Networks for Topic Modeling in Online Social Media},
  booktitle = {{ASONAM}},
  publisher = {{IEEE} Computer Society},
  year      = {2012},
  pages     = {202--209},
}
% ISAAC 2012 conference paper, published in LNCS volume 7676.
@inproceedings{DBLP:conf/isaac/BhattacharyaKS12,
  author    = {Bhattacharya, Binay K. and Kameda, Tsunehiko and Song, Zhao},
  title     = {Computing Minmax Regret 1-Median on a Tree Network with
               Positive/Negative Vertex Weights},
  booktitle = {{ISAAC}},
  series    = {Lecture Notes in Computer Science},
  volume    = {7676},
  publisher = {Springer},
  year      = {2012},
  pages     = {588--597},
}