1b:["$","$L29",null,{"isWhiteLabelled":false,"children":["$","$Lb",null,{"pt":{"compact":0,"expanded":3},"children":[["$","$L2a",null,{"noStar":true,"publisher":true,"task":true,"params":true,"size":"xl","product":{"id":"eyJwYXBlcklEIjoiMTkwMy4wMzYwNSIsInB1Ymxpc2hlciI6ImFyeGl2In0=","publisher":"arxiv","updated":"2020-03-26T17:51:43.000Z","paperID":"1903.03605","published":"2019-03-08T18:50:42.000Z","authors":"[\"Meena Jagadeesan\"]","title":"Understanding Sparse JL for Feature Hashing","scoreTrending":null,"summary":"$2b","lastCheckedForCode":"2022-09-06T08:17:55.028Z","links":[{"id":"eyJ1cmwiOiJodHRwczovL3BhcGVyc3dpdGhjb2RlLmNvbS9wYXBlci91bmRlcnN0YW5kaW5nLXNwYXJzZS1qbC1mb3ItZmVhdHVyZS1oYXNoaW5nIn0=","type":"pwc","url":"https://paperswithcode.com/paper/understanding-sparse-jl-for-feature-hashing","data":null},{"id":"eyJ1cmwiOiJodHRwczovL2dpdGh1Yi5jb20vbWphZ2FkZWVzYW4vc3BhcnNlamwtZmVhdHVyZWhhc2hpbmcifQ==","type":"code","url":"https://github.com/mjagadeesan/sparsejl-featurehashing","data":null}],"reposConnection":{"edges":[{"official":null,"node":{"id":"eyJyZXBvSUQiOiIyMTc3OTg3MjciLCJzb3VyY2UiOiJnaXRodWIifQ==","source":"github","repoID":"217798727","url":"https://github.com/mjagadeesan/sparsejl-featurehashing","title":"sparsejl-featurehashing","language":"python","stars":4,"forks":0,"framework":null,"scoreTrending":null,"updated":null,"created":null,"downloads":null,"likes":null,"owner":[{"username":"mjagadeesan","avatar":"https://avatars.githubusercontent.com/u/25335097?v=4"}]}}]},"models":[],"tags":[],"summaries":[],"emailsConnection":{"edges":[{"author":"meena 
jagadeesan","node":{"id":"eyJhZGRyZXNzIjoibWphZ2FkZWVzYW5AY29sbGVnZS5oYXJ2YXJkLmVkdSJ9","address":"mjagadeesan@college.harvard.edu","name":null,"avatar":null,"linkedin":null,"bio":null,"site":null,"override":null,"membership":[],"paper":[{"modelsAggregate":{"count":0}},{"modelsAggregate":{"count":0}},{"modelsAggregate":{"count":0}}],"github":[{"avatar":"https://avatars.githubusercontent.com/u/25335097?v=4","username":"mjagadeesan"}],"scholar":[{"thirdPartyID":"XW62DrcAAAAJ"}],"twitter":[],"location":[],"owner":[{"id":"eyJ1aWQiOiI2N2M2YmY1ZC0wZWI2LTQ0NzktOGNjNy1hZWU4MGRiMzE3ZDgifQ==","name":"Meena Jagadeesan","github":[],"email":[{"avatar":"https://img.fullcontact.com/static/30188c73a6a021694618c019d7cc9f82_56dd6e418bab53c917c71e27581e786a302cd0ea9b24c809ddf99e4b363790e1"}],"authored":[{"id":"eyJwYXBlcklEIjoiMjAwMy4xMzk2NiIsInB1Ymxpc2hlciI6ImFyeGl2In0=","publisher":"arxiv","paperID":"2003.13966"},{"id":"eyJwYXBlcklEIjoiMjQwMi4wNjYyNyIsInB1Ymxpc2hlciI6ImFyeGl2In0=","publisher":"arxiv","paperID":"2402.06627"},{"id":"eyJwYXBlcklEIjoiMTkwMy4wMzYwNSIsInB1Ymxpc2hlciI6ImFyeGl2In0=","publisher":"arxiv","paperID":"1903.03605"},{"id":"eyJwYXBlcklEIjoiMjEwMi4xMjIzOCIsInB1Ymxpc2hlciI6ImFyeGl2In0=","publisher":"arxiv","paperID":"2102.12238"},{"id":"eyJwYXBlcklEIjoiMTkwNi4wODczMiIsInB1Ymxpc2hlciI6ImFyeGl2In0=","publisher":"arxiv","paperID":"1906.08732"},{"id":"eyJwYXBlcklEIjoiMjEwNi4xMjcwNSIsInB1Ymxpc2hlciI6ImFyeGl2In0=","publisher":"arxiv","paperID":"2106.12705"},{"id":"eyJwYXBlcklEIjoiMjEwOC4wODg0MyIsInB1Ymxpc2hlciI6ImFyeGl2In0=","publisher":"arxiv","paperID":"2108.08843"},{"id":"eyJwYXBlcklEIjoiNTI4NTgiLCJwdWJsaXNoZXIiOiJuZXVyaXBzIn0=","publisher":"neurips","paperID":"52858"},{"id":"eyJwYXBlcklEIjoiNzA5MzgiLCJwdWJsaXNoZXIiOiJuZXVyaXBzIn0=","publisher":"neurips","paperID":"70938"},{"id":"eyJwYXBlcklEIjoiNzIxMDEiLCJwdWJsaXNoZXIiOiJuZXVyaXBzIn0=","publisher":"neurips","paperID":"72101"}]}]}}]},"__typename":"paper","authorArray":["Meena 
Jagadeesan"]}}],["$","$L18",null,{"container":true,"columns":100,"spacing":{"compact":0,"expanded":2,"large":3},"children":[["$","$L18",null,{"size":{"compact":100,"expanded":100,"large":68},"children":[["$","$7",null,{"children":["$","$L2c",null,{"publisher":"arxiv","paperID":"1903.03605","product":{"paper":"$1b:props:children:props:children:0:props:product","models":"$1b:props:children:props:children:0:props:product:models"},"isWhiteLabelled":false}]}],["$","$7",null,{"children":["$","$L2d",null,{"article":"$L2e","model":"$undefined"}]}]]}],["$","$L18",null,{"size":"grow","children":["$","$L2f",null,{}]}]]}],["$","$7",null,{"children":null}],[["$","audio",null,{"id":"tts"}],["$","$L30",null,{"paperID":"1903.03605","publisher":"arxiv","paperJSON":{"title":"Understanding Sparse JL for Feature Hashing","paperID":"1903.03605","avgLineHeight":11.97,"imgScale":4,"sections":[{"heading":"Abstract","paragraphs":[[{"text":"Feature hashing and other random projection schemes are commonly used to reduce the dimensionality of feature vectors. The goal is to efficiently project a high-dimensional feature vector living in ","element":"span"},{"style":{"height":10.5},"width":155.9,"height":26.24,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/0-0.png","element":"img","alt":" Rn into a","inline":true,"padRight":true},{"text":"much lower-dimensional space ","element":"span"},{"style":{"height":10.49},"width":51.9,"height":26.24,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/0-1.png","element":"img","alt":" Rm","inline":true},{"text":", while approximately preserving Euclidean norm. These schemes can be constructed using sparse random projections, for example using a sparse Johnson-Lindenstrauss (JL) transform. A line of work introduced by Weinberger et. 
al (ICML ’09) analyzes the accuracy of sparse JL with sparsity 1 on feature vectors with small ","element":"span"},{"style":{"height":10.79},"width":133.98,"height":26.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/0-2.png","element":"img","alt":" ℓ∞-to-ℓ2","inline":true,"padRight":true},{"text":"norm ratio. Recently, Freksen, Kamma, and Larsen (NeurIPS ’18) closed this line of work by proving a tight tradeoff between ","element":"span"},{"style":{"height":10.79},"width":133.98,"height":26.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/0-3.png","element":"img","alt":" ℓ∞-to-ℓ2","inline":true,"padRight":true},{"text":"norm ratio and accuracy for sparse JL with sparsity ","element":"span"},{"text":"1","element":"span"},{"text":".","element":"span"}],[{"text":"In this paper, we demonstrate the benefits of using sparsity ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"greater than ","element":"span"},{"text":"1 ","element":"span"},{"text":"in sparse JL on feature vectors. Our main result is a tight tradeoff between ","element":"span"},{"style":{"height":10.8},"width":133.98,"height":26.99,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/0-4.png","element":"img","alt":" ℓ∞-to-ℓ2","inline":true,"padRight":true},{"text":"norm ratio and accuracy for a general sparsity ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s","element":"span"},{"text":", that significantly generalizes the result of Freksen et. al. 
Our result theoretically demonstrates that sparse JL with ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s > ","element":"span"},{"text":"1 ","element":"span"},{"text":"can have significantly better norm-preservation properties on feature vectors than sparse JL with ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"= 1","element":"span"},{"text":"; we also empirically demonstrate this finding.","element":"span"}]]},{"heading":"1 Introduction","paragraphs":[[{"text":"Feature hashing and other random projection schemes are influential in helping manage large data ","element":"span"},{"href":"#id-0","referenceIndex":11,"text":"[11]","element":"a"},{"text":". The goal is to ","element":"span"},{"style":{"fontStyle":"italic"},"text":"reduce the dimensionality ","element":"span"},{"text":"of feature vectors: more specifically, to project high-dimensional feature vectors living in ","element":"span"},{"style":{"height":10.8},"width":48.78,"height":27,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/0-5.png","element":"img","alt":" Rn","inline":true,"padRight":true},{"text":"into a lower dimensional space ","element":"span"},{"style":{"height":10.8},"width":56.78,"height":27,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/0-6.png","element":"img","alt":" Rm","inline":true,"padRight":true},{"text":"(where ","element":"span"},{"style":{"height":10.4},"width":131.5,"height":26,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/0-7.png","element":"img","alt":" m ≪ n","inline":true},{"text":"), while approximately preserving Euclidean distances (i.e. ","element":"span"},{"style":{"height":7.6},"width":32.61,"height":19,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/0-8.png","element":"img","alt":" ℓ2","inline":true,"padRight":true},{"text":"distances) with high probability. 
This dimensionality reduction enables a classifier to process vectors in ","element":"span"},{"style":{"height":10.8},"width":56.78,"height":27,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/0-9.png","element":"img","alt":" Rm","inline":true},{"text":", instead of vectors in ","element":"span"},{"style":{"height":10.8},"width":48.78,"height":27,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/0-10.png","element":"img","alt":" Rn","inline":true},{"text":". In this context, feature hashing was first introduced by Weinberger et. al ","element":"span"},{"href":"#id-1","referenceIndex":29,"text":"[29] ","element":"a"},{"text":"for document-based classification tasks such as email spam filtering. For such tasks, feature hashing yields a lower dimensional embedding of a high-dimensional feature vector derived from a bag-of-words model. Since then, feature hashing has become a mainstream approach ","element":"span"},{"href":"#id-2","referenceIndex":28,"text":"[28]","element":"a"},{"text":", applied to numerous domains including ranking text documents ","element":"span"},{"href":"#id-3","referenceIndex":4,"text":"[4]","element":"a"},{"text":", compressing neural networks ","element":"span"},{"href":"#id-4","referenceIndex":7,"text":"[7]","element":"a"},{"text":", and protein sequence classification ","element":"span"},{"href":"#id-5","referenceIndex":5,"text":"[5]","element":"a"},{"text":".","element":"span"}],[{"style":{"fontWeight":"bold"},"text":"Random Projections","element":"span"}],[{"text":"Dimensionality reduction schemes for feature vectors fit nicely into the random projection literature. In fact, the feature hashing scheme proposed by Weinberger et al. 
","element":"span"},{"href":"#id-1","referenceIndex":29,"text":"[29] ","element":"a"},{"text":"boils down to uniformly drawing a random ","element":"span"},{"style":{"height":8},"width":107.7,"height":20,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/0-11.png","element":"img","alt":"m × n","inline":true,"padRight":true},{"text":"matrix where each column contains ","element":"span"},{"style":{"fontStyle":"italic"},"text":"one ","element":"span"},{"text":"nonzero entry, equal to ","element":"span"},{"style":{"height":10.8},"width":51,"height":27,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/0-12.png","element":"img","alt":" −1","inline":true,"padRight":true},{"text":"or ","element":"span"},{"text":"1","element":"span"},{"text":".","element":"span"}],[{"text":"The ","element":"span"},{"style":{"height":7.6},"width":32.61,"height":19,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/0-13.png","element":"img","alt":" ℓ2","inline":true},{"text":"-norm-preserving objective can be expressed mathematically as follows: for error ","element":"span"},{"style":{"height":11.6},"width":94.26,"height":29,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/0-14.png","element":"img","alt":" ϵ > 0","inline":true,"padRight":true},{"text":"and failure probability ","element":"span"},{"style":{"height":11.6},"width":19,"height":29,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/0-15.png","element":"img","alt":" δ","inline":true},{"text":", the goal is to construct a probability distribution ","element":"span"},{"style":{"fontStyle":"italic"},"text":"A ","element":"span"},{"text":"over ","element":"span"},{"style":{"height":8},"width":108.93,"height":20,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/0-16.png","element":"img","alt":" m × n","inline":true,"padRight":true},{"text":"real matrices that satisfies the following condition for vectors 
","element":"span"},{"style":{"height":11.6},"width":120.26,"height":29,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/0-17.png","element":"img","alt":" x ∈ Rn","inline":true},{"text":":","element":"span"}],[{"id":"id-6","style":{"width":"73%"},"width":1398,"height":42,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/0-18.png","element":"img"}],[{"text":"The result underlying the random projection literature is the Johnson-Lindenstrauss lemma, which gives an upper bound on the dimension ","element":"span"},{"style":{"fontStyle":"italic"},"text":"m ","element":"span"},{"text":"achievable by a probability distribution ","element":"span"},{"style":{"fontStyle":"italic"},"text":"A ","element":"span"},{"text":"satisfying ","element":"span"},{"href":"#id-6","text":"(1)","element":"a"},{"text":":","element":"span"}],[{"style":{"fontWeight":"bold"},"text":"Lemma 1.1 (Johnson-Lindenstrauss ","element":"span"},{"href":"#id-7","referenceIndex":16,"style":{"fontWeight":"bold"},"text":"[16]","element":"a"},{"style":{"fontWeight":"bold"},"text":") ","element":"span"},{"text":"For any ","element":"span"},{"style":{"height":11.6},"width":117.83,"height":29,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-0.png","element":"img","alt":" n ∈ N","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":16},"width":207.07,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-1.png","element":"img","alt":" ϵ, δ ∈ (0, 1)","inline":true},{"text":", there exists a probability distribution ","element":"span"},{"style":{"fontStyle":"italic"},"text":"A ","element":"span"},{"text":"over ","element":"span"},{"style":{"height":8},"width":107.69,"height":20,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-2.png","element":"img","alt":" m × n","inline":true,"padRight":true},{"text":"matrices, with 
","element":"span"},{"style":{"height":17.38},"width":339.5,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-3.png","element":"img","alt":" m = Θ(ϵ−2 ln(1/δ))","inline":true},{"text":", that satisfies ","element":"span"},{"href":"#id-6","text":"(1)","element":"a"},{"text":".","element":"span"}],[{"text":"The optimality of the dimension ","element":"span"},{"style":{"fontStyle":"italic"},"text":"m ","element":"span"},{"text":"achieved by Lemma ","element":"span"},{"text":"1","element":"span"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"1 ","element":"span"},{"text":"has been proven ","element":"span"},{"href":"#id-8","referenceIndex":17,"text":"[17, ","element":"a"},{"href":"#id-9","referenceIndex":15,"text":"15]","element":"a"},{"text":".","element":"span"}],[{"text":"To speed up projection time, it is useful to consider probability distributions over sparse matrices (i.e. matrices with a small number of nonzero entries per column). 
More specifically, for matrices with ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"nonzero entries per column, the projection time for a vector ","element":"span"},{"style":{"fontStyle":"italic"},"text":"x ","element":"span"},{"text":"goes down from ","element":"span"},{"style":{"height":16.78},"width":185.14,"height":41.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-4.png","element":"img","alt":" O(m ∥x∥0)","inline":true,"padRight":true},{"text":"to ","element":"span"},{"style":{"height":16.78},"width":168.82,"height":41.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-5.png","element":"img","alt":" O(s ∥x∥0)","inline":true},{"text":", where ","element":"span"},{"style":{"height":16.78},"width":78.63,"height":41.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-6.png","element":"img","alt":" ∥x∥0","inline":true,"padRight":true},{"text":"is the number of nonzero entries of ","element":"span"},{"style":{"fontStyle":"italic"},"text":"x","element":"span"},{"text":". In this context, Kane and Nelson ","element":"span"},{"href":"#id-10","referenceIndex":19,"text":"[19] ","element":"a"},{"text":"constructed sparse JL distributions (which we define formally in Section ","element":"span"},{"href":"#id-11","text":"1.1)","element":"a"},{"text":", improving upon previous work ","element":"span"},{"href":"#id-12","referenceIndex":2,"text":"[2, ","element":"a"},{"href":"#id-13","referenceIndex":22,"text":"22, ","element":"a"},{"href":"#id-14","referenceIndex":12,"text":"12]","element":"a"},{"text":". 
Roughly speaking, a sparse JL distribution, as constructed in ","element":"span"},{"href":"#id-10","referenceIndex":19,"text":"[19]","element":"a"},{"text":", boils down to drawing a random ","element":"span"},{"style":{"height":8},"width":114.22,"height":20,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-7.png","element":"img","alt":" m × n","inline":true,"padRight":true},{"text":"matrix where each column contains exactly ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"nonzero entries, each equal to ","element":"span"},{"style":{"height":16.28},"width":123.05,"height":40.7,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-8.png","element":"img","alt":" −1/√s","inline":true,"padRight":true},{"text":"or ","element":"span"},{"style":{"height":16.28},"width":92.06,"height":40.7,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-9.png","element":"img","alt":" 1/√s","inline":true},{"text":". 
Kane and Nelson show that sparse JL distributions achieve the same (optimal) dimension as Lemma ","element":"span"},{"text":"1","element":"span"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"1","element":"span"},{"text":", while also satisfying a sparsity property.","element":"span"}],[{"id":"id-16","style":{"fontWeight":"bold"},"text":"Theorem 1.2 (Sparse JL ","element":"span"},{"href":"#id-10","referenceIndex":19,"style":{"fontWeight":"bold"},"text":"[19]","element":"a"},{"style":{"fontWeight":"bold"},"text":") ","element":"span"},{"text":"For any ","element":"span"},{"style":{"height":11.6},"width":101.63,"height":29,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-10.png","element":"img","alt":" n ∈ N","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":16},"width":190.87,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-11.png","element":"img","alt":" ϵ, δ ∈ (0, 1)","inline":true},{"text":", a sparse JL distribution ","element":"span"},{"style":{"height":16.39},"width":114.06,"height":40.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-12.png","element":"img","alt":" As,m,n","inline":true,"padRight":true},{"text":"(defined formally in Section ","element":"span"},{"href":"#id-11","text":"1.1) ","element":"a"},{"text":"over ","element":"span"},{"style":{"height":8},"width":99.78,"height":20,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-13.png","element":"img","alt":" m×n","inline":true,"padRight":true},{"text":"matrices, with dimension ","element":"span"},{"style":{"height":17.39},"width":339.5,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-14.png","element":"img","alt":" m = Θ(ϵ−2 ln(1/δ))","inline":true,"padRight":true},{"text":"and sparsity 
","element":"span"},{"style":{"height":17.39},"width":323.18,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-15.png","element":"img","alt":" s = Θ(ϵ−1 ln(1/δ))","inline":true},{"text":", satisfies ","element":"span"},{"href":"#id-6","text":"(1)","element":"a"},{"text":".","element":"span"}],[{"text":"Sparse JL distributions are state-of-the-art sparse random projections, and achieve a sparsity that is nearly optimal when the dimension ","element":"span"},{"style":{"fontStyle":"italic"},"text":"m ","element":"span"},{"text":"is ","element":"span"},{"style":{"height":17.39},"width":277.93,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-16.png","element":"img","alt":" Θ(ϵ−2 ln(1/δ)).1","inline":true,"padRight":true},{"text":"However, in practice, it can be necessary to utilize a lower sparsity ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s","element":"span"},{"text":", since the projection time is linear in ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s","element":"span"},{"text":". Resolving this issue, Cohen ","element":"span"},{"href":"#id-15","referenceIndex":8,"text":"[8] ","element":"a"},{"text":"extended the upper bound in Theorem ","element":"span"},{"href":"#id-16","text":"1.2 ","element":"a"},{"text":"to show that sparse JL distributions can achieve a lower sparsity with an appropriate gain in dimension. 
He proved the following dimension-sparsity tradeoffs:","element":"span"}],[{"id":"id-17","style":{"fontWeight":"bold"},"text":"Theorem 1.3 (Dimension-Sparsity Tradeoffs ","element":"span"},{"href":"#id-15","referenceIndex":8,"style":{"fontWeight":"bold"},"text":"[8]","element":"a"},{"style":{"fontWeight":"bold"},"text":") ","element":"span"},{"text":"For any ","element":"span"},{"style":{"height":11.6},"width":107.4,"height":29,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-17.png","element":"img","alt":" n ∈ N","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":16},"width":196.65,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-18.png","element":"img","alt":" ϵ, δ ∈ (0, 1)","inline":true},{"text":", a uniform sparse JL distribution ","element":"span"},{"style":{"height":16.39},"width":114.05,"height":40.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-19.png","element":"img","alt":" As,m,n","inline":true,"padRight":true},{"text":"(defined formally in Section ","element":"span"},{"href":"#id-11","text":"1.1)","element":"a"},{"text":", with ","element":"span"},{"style":{"height":17.39},"width":323.18,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-20.png","element":"img","alt":" s ≤ Θ(ϵ−1 ln(1/δ))","inline":true,"padRight":true},{"text":"and","element":"span"}],[{"style":{"width":"42%"},"width":808,"height":73,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-21.png","element":"img"}],[{"text":"satisfies ","element":"span"},{"href":"#id-6","text":"(1)","element":"a"},{"text":".","element":"span"}],[{"style":{"fontWeight":"bold"},"text":"Connection to Feature Hashing","element":"span"}],[{"text":"Sparse JL distributions have particularly close ties to feature hashing. ","element":"span"},{"text":"In particular, the feature hashing scheme proposed by Weinberger et al. 
","element":"span"},{"href":"#id-1","referenceIndex":29,"text":"[29] ","element":"a"},{"text":"can be viewed as a special case of sparse JL, namely with ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"= 1","element":"span"},{"text":". Interestingly, in practice, feature hashing can do much better than theoretical results, such as Theorem ","element":"span"},{"href":"#id-16","text":"1","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"2 ","element":"span"},{"text":"and Theorem ","element":"span"},{"href":"#id-17","text":"1","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"3","element":"span"},{"text":", would indicate ","element":"span"},{"href":"#id-18","referenceIndex":13,"text":"[13]","element":"a"},{"text":". An explanation for this phenomenon is that the highest error terms in sparse JL stem from vectors with mass concentrated on a very small number of entries, while in practice, the mass on feature vectors may be spread out between many coordinates. 
This motivates studying the tradeoff space for vectors with low ","element":"span"},{"style":{"height":5.2},"width":48.6,"height":13,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-22.png","element":"img","alt":" ℓ∞","inline":true},{"text":"-to-","element":"span"},{"style":{"height":7.6},"width":32.6,"height":19,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-23.png","element":"img","alt":"ℓ2","inline":true,"padRight":true},{"text":"ratio.","element":"span"}],[{"text":"More formally, take ","element":"span"},{"style":{"height":13.19},"width":40.44,"height":32.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-24.png","element":"img","alt":" Sv","inline":true,"padRight":true},{"text":"to be","element":"span"},{"style":{"height":29.2},"width":372.02,"height":73,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-25.png","element":"img","alt":"�x ∈ Rn | ∥x∥∞∥x∥2 ≤ v�","inline":true},{"text":", so that ","element":"span"},{"style":{"height":13.19},"width":154.08,"height":32.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-26.png","element":"img","alt":" S1 = Rn","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":14.4},"width":153.79,"height":36,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-27.png","element":"img","alt":" Sv ⊊ Sw","inline":true,"padRight":true},{"text":"for ","element":"span"},{"style":{"height":13.2},"width":279.22,"height":33,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-28.png","element":"img","alt":" 0 ≤ v < w ≤ 1","inline":true},{"text":". 
Let ","element":"span"},{"style":{"height":16},"width":192.23,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-29.png","element":"img","alt":" v(m, ϵ, δ, s)","inline":true,"padRight":true},{"text":"be the supremum over all ","element":"span"},{"style":{"height":13.2},"width":183.05,"height":33,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-30.png","element":"img","alt":" 0 ≤ v ≤ 1","inline":true,"padRight":true},{"text":"such that a sparse JL distribution with sparsity ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"and dimension ","element":"span"},{"style":{"fontStyle":"italic"},"text":"m ","element":"span"},{"text":"satisfies ","element":"span"},{"href":"#id-6","text":"(1) ","element":"a"},{"text":"for each ","element":"span"},{"style":{"height":13.19},"width":113.6,"height":32.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-31.png","element":"img","alt":" x ∈ Sv","inline":true},{"text":". 
(That is, ","element":"span"},{"style":{"height":16},"width":192.23,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-32.png","element":"img","alt":" v(m, ϵ, δ, s)","inline":true,"padRight":true},{"text":"is the maximum ","element":"span"},{"style":{"height":16},"width":150.77,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-33.png","element":"img","alt":" v ∈ [0, 1]","inline":true,"padRight":true},{"text":"such that for every ","element":"span"},{"style":{"height":11.6},"width":122.95,"height":29,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-34.png","element":"img","alt":"x ∈ Rn","inline":true},{"text":", if ","element":"span"},{"style":{"height":16.78},"width":258.22,"height":41.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-35.png","element":"img","alt":" ∥x∥∞ ≤ v ∥x∥2","inline":true,"padRight":true},{"text":"then ","element":"span"},{"href":"#id-6","text":"(1) ","element":"a"},{"text":"holds.","element":"span"},{"style":{"height":7.6},"width":16,"height":19,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-36.png","element":"img","alt":"2","inline":true},{"text":") For ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"= 1","element":"span"},{"text":", a line of work ","element":"span"},{"href":"#id-1","referenceIndex":29,"text":"[29, ","element":"a"},{"href":"#id-14","referenceIndex":12,"text":"12, ","element":"a"},{"href":"#id-19","referenceIndex":18,"text":"18, ","element":"a"},{"href":"#id-20","referenceIndex":10,"text":"10, ","element":"a"},{"href":"#id-10","referenceIndex":19,"text":"19] ","element":"a"},{"text":"improved bounds on ","element":"span"},{"style":{"height":16},"width":193.47,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-37.png","element":"img","alt":"v(m, ϵ, δ, 1)","inline":true},{"text":", and was recently closed by Freksen et 
al. ","element":"span"},{"href":"#id-18","referenceIndex":13,"text":"[13]","element":"a"},{"text":".","element":"span"}],[{"id":"id-21","style":{"fontWeight":"bold"},"text":"Theorem 1.4 (","element":"span"},{"href":"#id-18","referenceIndex":13,"style":{"fontWeight":"bold"},"text":"[13]","element":"a"},{"style":{"fontWeight":"bold"},"text":") ","element":"span"},{"text":"For any ","element":"span"},{"style":{"height":11.6},"width":123.08,"height":29,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-38.png","element":"img","alt":" m ∈ N","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":16},"width":201.26,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-39.png","element":"img","alt":" ϵ, δ ∈ (0, 1)","inline":true},{"text":", the function ","element":"span"},{"style":{"height":16},"width":193.47,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-40.png","element":"img","alt":" v(m, ϵ, δ, 1)","inline":true,"padRight":true},{"text":"is equal to ","element":"span"},{"style":{"height":16},"width":265.16,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-41.png","element":"img","alt":" f(m, ϵ, ln(1/δ))","inline":true,"padRight":true},{"text":"where:","element":"span"}],[{"style":{"width":"68%"},"width":1306,"height":214,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/1-42.png","element":"img"}],[{"style":{"fontWeight":"bold"},"text":"Generalizing to Sparse Random Projections with ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s > ","element":"span"},{"text":"1","element":"span"}],[{"text":"While Theorem ","element":"span"},{"href":"#id-21","text":"1","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"4 ","element":"span"},{"text":"is restricted to the case of ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"= 
1","element":"span"},{"text":", dimensionality reduction schemes constructed using sparse random projections with sparsity ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s > ","element":"span"},{"text":"1 ","element":"span"},{"text":"have been used in practice for projecting feature vectors. For example, sparse JL-like methods (with ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s > ","element":"span"},{"text":"1","element":"span"},{"text":") have been used to project feature vectors in machine learning domains including visual tracking ","element":"span"},{"href":"#id-22","referenceIndex":27,"text":"[27]","element":"a"},{"text":", face recognition ","element":"span"},{"href":"#id-23","referenceIndex":23,"text":"[23]","element":"a"},{"text":", and recently in ELM ","element":"span"},{"href":"#id-24","referenceIndex":6,"text":"[6]","element":"a"},{"text":". Now, a variant of sparse JL is included in the Python sklearn library.","element":"span"},{"style":{"height":7.6},"width":16,"height":19,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-0.png","element":"img","alt":"3","inline":true}],[{"text":"In this context, it is natural to explore how constructions with ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s > ","element":"span"},{"text":"1 ","element":"span"},{"text":"perform on feature vectors, by studying ","element":"span"},{"style":{"height":16},"width":192.23,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-1.png","element":"img","alt":"v(m, ϵ, δ, s)","inline":true,"padRight":true},{"text":"for sparse JL with ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s > ","element":"span"},{"text":"1","element":"span"},{"text":". In fact, a related question was considered by Weinberger et al. 
","element":"span"},{"href":"#id-1","referenceIndex":29,"text":"[29] ","element":"a"},{"text":"for “multiple hashing,” an alternate distribution over sparse matrices constructed by adding ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"draws from ","element":"span"},{"style":{"height":16.39},"width":114.9,"height":40.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-2.png","element":"img","alt":" A1,m,n","inline":true,"padRight":true},{"text":"and scaling by ","element":"span"},{"style":{"height":16.28},"width":92.06,"height":40.7,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-3.png","element":"img","alt":" 1/√s","inline":true},{"text":". More specifically, they show that ","element":"span"},{"style":{"height":16.28},"width":672.42,"height":40.7,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-4.png","element":"img","alt":" v(m, ϵ, δ, s) ≥ min(1, √s · v(m, ϵ, δ, 1))","inline":true,"padRight":true},{"text":"for multiple hashing. However, Kane and Nelson ","element":"span"},{"href":"#id-10","referenceIndex":19,"text":"[19] ","element":"a"},{"text":"later showed that multiple hashing has worse geometry-preserving properties than sparse JL: that is, multiple hashing requires a larger sparsity than sparse JL to satisfy ","element":"span"},{"href":"#id-6","text":"(1)","element":"a"},{"text":".","element":"span"}],[{"text":"Characterizing ","element":"span"},{"style":{"height":16},"width":192.23,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-5.png","element":"img","alt":" v(m, ϵ, δ, s)","inline":true,"padRight":true},{"text":"for sparse JL distributions, which are state-of-the-art, remained an open problem. 
In this work, we settle how ","element":"span"},{"style":{"height":16},"width":192.23,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-6.png","element":"img","alt":" v(m, ϵ, δ, s)","inline":true,"padRight":true},{"text":"behaves for sparse JL with a general sparsity ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s > ","element":"span"},{"text":"1","element":"span"},{"text":", giving tight bounds. Our theoretical result shows that sparse JL with ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s > ","element":"span"},{"text":"1","element":"span"},{"text":", even if ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"is a small constant, can achieve significantly better norm-preservation properties for feature vectors than sparse JL with ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"= 1","element":"span"},{"text":". Moreover, we empirically demonstrate this finding.","element":"span"}],[{"style":{"fontWeight":"bold"},"text":"Main Results","element":"span"}],[{"text":"We show the following tight bounds on ","element":"span"},{"style":{"height":16},"width":192.23,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-7.png","element":"img","alt":" v(m, ϵ, δ, s)","inline":true,"padRight":true},{"text":"for a general sparsity ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s","element":"span"},{"text":":","element":"span"}],[{"id":"id-25","style":{"fontWeight":"bold"},"text":"Theorem 1.5 ","element":"span"},{"text":"For any ","element":"span"},{"style":{"height":14},"width":159.33,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-8.png","element":"img","alt":" s, m ∈ N","inline":true,"padRight":true},{"text":"such that 
","element":"span"},{"style":{"height":16},"width":155.96,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-9.png","element":"img","alt":" s ≤ m/e","inline":true},{"text":", consider a uniform sparse JL distribution (defined in Section ","element":"span"},{"href":"#id-11","text":"1.1) ","element":"a"},{"text":"with sparsity ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"and dimension ","element":"span"},{"style":{"height":13.38},"width":62.06,"height":33.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-10.png","element":"img","alt":" m.4","inline":true,"padRight":true},{"text":"If ","element":"span"},{"style":{"height":0},"width":20,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-11.png","element":"img","alt":" ϵ","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":11.6},"width":19,"height":29,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-12.png","element":"img","alt":" δ","inline":true,"padRight":true},{"text":"are small enough","element":"span"},{"style":{"height":7.6},"width":16,"height":19,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-13.png","element":"img","alt":"5","inline":true},{"text":", the function ","element":"span"},{"style":{"height":16},"width":192.23,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-14.png","element":"img","alt":" v(m, ϵ, δ, s)","inline":true,"padRight":true},{"text":"is equal","element":"span"}],[{"style":{"width":"91%"},"width":1758,"height":488,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-15.png","element":"img"}],[{"text":"Our main result, Theorem ","element":"span"},{"href":"#id-25","text":"1.5, ","element":"a"},{"text":"significantly generalizes Theorem ","element":"span"},{"href":"#id-16","text":"1.2, ","element":"a"},{"text":"Theorem 
","element":"span"},{"href":"#id-17","text":"1.3, ","element":"a"},{"text":"and Theorem ","element":"span"},{"href":"#id-21","text":"1.4. ","element":"a"},{"text":"Notice our bound in Theorem ","element":"span"},{"href":"#id-25","text":"1.5 ","element":"a"},{"text":"has up to four regimes. ","element":"span"},{"text":"In the first regime, which occurs when ","element":"span"},{"style":{"height":12.8},"width":87.4,"height":32,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-16.png","element":"img","alt":" m ≥","inline":true},{"style":{"height":20.19},"width":780.33,"height":50.48,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-17.png","element":"img","alt":"min(2ϵ−2/δ, ϵ−2 ln(1/δ)eΘ(max(1,ln(1/δ)ϵ−1/s)))","inline":true},{"text":", Theorem ","element":"span"},{"href":"#id-25","text":"1.5 ","element":"a"},{"text":"shows ","element":"span"},{"style":{"height":16},"width":282.78,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-18.png","element":"img","alt":" v(m, ϵ, δ, s) = 1","inline":true},{"text":", so ","element":"span"},{"href":"#id-6","text":"(1) ","element":"a"},{"text":"holds on the full space ","element":"span"},{"style":{"height":10.8},"width":48.78,"height":27,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-19.png","element":"img","alt":" Rn","inline":true},{"text":". Notice this boundary on ","element":"span"},{"style":{"fontStyle":"italic"},"text":"m ","element":"span"},{"text":"occurs at the dimensionality-sparsity tradeoff in Theorem ","element":"span"},{"href":"#id-17","text":"1.3. 
","element":"a"},{"text":"In the last regime, which occurs when ","element":"span"},{"style":{"height":17.39},"width":350.32,"height":43.47,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-20.png","element":"img","alt":" m ≤ Θ(ϵ−2 ln(1/δ))","inline":true},{"text":", Theorem ","element":"span"},{"href":"#id-25","text":"1.5 ","element":"a"},{"text":"shows that ","element":"span"},{"style":{"height":16},"width":275.69,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-21.png","element":"img","alt":" v(m, ϵ, δ, s) = 0","inline":true},{"text":", so there are vectors with arbitrarily small ","element":"span"},{"style":{"height":5.2},"width":48.61,"height":13,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-22.png","element":"img","alt":" ℓ∞","inline":true},{"text":"-to-","element":"span"},{"style":{"height":7.6},"width":32.6,"height":19,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-23.png","element":"img","alt":"ℓ2","inline":true,"padRight":true},{"text":"norm ratio where ","element":"span"},{"href":"#id-6","text":"(1) ","element":"a"},{"text":"does not hold. When ","element":"span"},{"style":{"height":17.38},"width":323.18,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-24.png","element":"img","alt":" s ≤ Θ(ϵ−1 ln(1/δ))","inline":true},{"text":", Theorem ","element":"span"},{"href":"#id-25","text":"1.5 ","element":"a"},{"text":"shows that up to two intermediate regimes exist. 
One of the regimes, ","element":"span"},{"style":{"height":28.8},"width":651.55,"height":72,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-25.png","element":"img","alt":" Θ(√ϵs min(ln( mϵp )/p,�ln( mϵ2p )/√p))","inline":true},{"text":", ","element":"span"},{"text":"matches the middle regime of ","element":"span"},{"style":{"height":16},"width":193.47,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-26.png","element":"img","alt":" v(m, ϵ, δ, 1)","inline":true,"padRight":true},{"text":"in Theorem ","element":"span"},{"href":"#id-21","text":"1.4 ","element":"a"},{"text":"with an extra factor of ","element":"span"},{"style":{"height":16},"width":52.21,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-27.png","element":"img","alt":"√s","inline":true},{"text":", much like the bound for multiple hashing in ","element":"span"},{"href":"#id-1","referenceIndex":29,"text":"[29] ","element":"a"},{"text":"that we mentioned previously. ","element":"span"},{"text":"However, unlike the multiple hashing bound, Theorem ","element":"span"},{"href":"#id-25","text":"1.5 ","element":"a"},{"text":"sometimes has another regime, ","element":"span"},{"style":{"height":28.8},"width":374.47,"height":72,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-28.png","element":"img","alt":" Θ(√ϵs�ln( mϵ2p )/√p)","inline":true},{"text":", which does not arise for ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"= 1 ","element":"span"},{"text":"(i.e. 
in ","element":"span"},{"text":"Theorem ","element":"span"},{"href":"#id-21","text":"1.4)","element":"a"},{"text":".","element":"span"},{"style":{"height":7.6},"width":16,"height":19,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-29.png","element":"img","alt":"7","inline":true,"padRight":true},{"text":"Intuitively, we expect this additional regime for sparse JL with ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"close to ","element":"span"},{"style":{"height":17.38},"width":251.37,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-30.png","element":"img","alt":" Θ(ϵ−1 ln(1/δ))","inline":true},{"text":": at ","element":"span"},{"style":{"height":17.38},"width":338.46,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-31.png","element":"img","alt":"s = Θ(ϵ−1 ln(1/δ))","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":17.38},"width":354.78,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-32.png","element":"img","alt":" m = Θ(ϵ−2 ln(1/δ))","inline":true},{"text":", Theorem ","element":"span"},{"href":"#id-16","text":"1","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"2 ","element":"span"},{"text":"tells us ","element":"span"},{"style":{"height":16},"width":280.16,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-33.png","element":"img","alt":" v(m, ϵ, δ, s) = 1","inline":true},{"text":", but if ","element":"span"},{"style":{"height":0},"width":20,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/2-34.png","element":"img","alt":" ϵ","inline":true,"padRight":true},{"text":"is a constant, then the branch ","element":"span"},{"style":{"height":28.8},"width":322.4,"height":72,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-0.png","element":"img","alt":" Θ(√ϵs 
ln�mϵp�/p)","inline":true,"padRight":true},{"text":"yields ","element":"span"},{"style":{"height":19.2},"width":265.47,"height":48,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-1.png","element":"img","alt":" Θ(1/�ln(1/δ))","inline":true},{"text":", while the branch ","element":"span"},{"style":{"height":28.8},"width":374.47,"height":72,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-2.png","element":"img","alt":" Θ(√ϵs�ln( mϵ2p )/√p)","inline":true,"padRight":true},{"text":"yields ","element":"span"},{"style":{"height":16},"width":82.43,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-3.png","element":"img","alt":" Θ(1)","inline":true},{"text":". ","element":"span"},{"text":"Thus, it is natural that the first branch disappears for large ","element":"span"},{"style":{"fontStyle":"italic"},"text":"m","element":"span"},{"text":".","element":"span"}],[{"text":"Our result elucidates that ","element":"span"},{"style":{"height":16},"width":192.23,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-4.png","element":"img","alt":" v(m, ϵ, δ, s)","inline":true,"padRight":true},{"text":"increases approximately as ","element":"span"},{"style":{"height":16},"width":52.21,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-5.png","element":"img","alt":"√s","inline":true},{"text":", thus providing insight into how even small constant increases in sparsity can be useful in practice. Another consequence of our result is a lower bound on dimension-sparsity tradeoffs (Corollary ","element":"span"},{"href":"#id-26","text":"A.1 ","element":"a"},{"text":"in Appendix ","element":"span"},{"text":"A) ","element":"span"},{"text":"that essentially matches the upper bound in Theorem ","element":"span"},{"href":"#id-17","text":"1.3. 
","element":"a"},{"text":"Moreover, we require new techniques to prove Theorem ","element":"span"},{"href":"#id-25","text":"1.5, ","element":"a"},{"text":"for reasons that we discuss further in Section ","element":"span"},{"href":"#id-27","text":"1.2.","element":"a"}],[{"text":"We also empirically support our theoretical findings in Theorem ","element":"span"},{"href":"#id-25","text":"1.5. ","element":"a"},{"text":"First, we illustrate with real-world datasets the potential benefits of using small constants ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s > ","element":"span"},{"text":"1 ","element":"span"},{"text":"for sparse JL on feature vectors. We specifically show that ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"= ","element":"span"},{"style":{"fontStyle":"italic"},"text":"{","element":"span"},{"text":"4","element":"span"},{"style":{"fontStyle":"italic"},"text":", ","element":"span"},{"text":"8","element":"span"},{"style":{"fontStyle":"italic"},"text":", ","element":"span"},{"text":"16","element":"span"},{"style":{"fontStyle":"italic"},"text":"} ","element":"span"},{"text":"consistently outperforms ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"= 1 ","element":"span"},{"text":"in preserving the ","element":"span"},{"style":{"height":7.6},"width":32.6,"height":19,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-6.png","element":"img","alt":" ℓ2","inline":true,"padRight":true},{"text":"norm of each vector, and that there can be up to a ","element":"span"},{"style":{"fontStyle":"italic"},"text":"factor of ten ","element":"span"},{"text":"decrease in failure probability for ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"= 8","element":"span"},{"style":{"fontStyle":"italic"},"text":", ","element":"span"},{"text":"16 ","element":"span"},{"text":"in comparison to 
","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"= 1","element":"span"},{"text":". Second, we use synthetic data to illustrate phase transitions and other trends in Theorem ","element":"span"},{"href":"#id-25","text":"1.5. ","element":"a"},{"text":"More specifically, we empirically show that ","element":"span"},{"style":{"height":16},"width":192.23,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-7.png","element":"img","alt":" v(m, ϵ, δ, s)","inline":true,"padRight":true},{"text":"is not smooth, and that the middle regime(s) of ","element":"span"},{"style":{"height":16},"width":192.23,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-8.png","element":"img","alt":" v(m, ϵ, δ, s)","inline":true,"padRight":true},{"text":"increases with ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s","element":"span"},{"text":".","element":"span"}],[{"id":"id-11","style":{"fontWeight":"bold"},"text":"1.1 ","element":"span"},{"style":{"fontWeight":"bold"},"text":"Preliminaries","element":"span"}],[{"text":"Let ","element":"span"},{"style":{"height":16.39},"width":114.05,"height":40.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-9.png","element":"img","alt":" As,m,n","inline":true,"padRight":true},{"text":"be a ","element":"span"},{"style":{"fontWeight":"bold"},"text":"sparse JL distribution ","element":"span"},{"text":"if the entries of a matrix ","element":"span"},{"style":{"height":16.39},"width":195.5,"height":40.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-10.png","element":"img","alt":" A ∈ As,m,n","inline":true,"padRight":true},{"text":"are generated as follows. 
Let ","element":"span"},{"style":{"height":17.07},"width":307.73,"height":42.68,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-11.png","element":"img","alt":"Ar,i = ηr,iσr,i/√s","inline":true,"padRight":true},{"text":"where ","element":"span"},{"style":{"height":20.16},"width":262.68,"height":50.4,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-12.png","element":"img","alt":" {σr,i}r∈[m],i∈[n]","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":20.16},"width":259.7,"height":50.4,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-13.png","element":"img","alt":" {ηr,i}r∈[m],i∈[n]","inline":true,"padRight":true},{"text":"are defined as follows:","element":"span"}],[{"style":{"fontStyle":"italic"},"text":"• ","element":"span"},{"text":"The families ","element":"span"},{"style":{"height":20.16},"width":262.68,"height":50.4,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-14.png","element":"img","alt":" {σr,i}r∈[m],i∈[n]","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":20.16},"width":259.7,"height":50.4,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-15.png","element":"img","alt":" {ηr,i}r∈[m],i∈[n]","inline":true,"padRight":true},{"text":"are independent from each other.","element":"span"}],[{"style":{"fontStyle":"italic"},"text":"• ","element":"span"},{"text":"The variables ","element":"span"},{"style":{"height":20.16},"width":262.68,"height":50.39,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-16.png","element":"img","alt":" {σr,i}r∈[m],i∈[n]","inline":true,"padRight":true},{"text":"are i.i.d Rademachers (","element":"span"},{"style":{"height":10.8},"width":51,"height":27,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-17.png","element":"img","alt":"±1","inline":true,"padRight":true},{"text":"coin 
flips).","element":"span"}],[{"style":{"fontStyle":"italic"},"text":"• ","element":"span"},{"text":"The variables ","element":"span"},{"style":{"height":20.16},"width":259.7,"height":50.39,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-18.png","element":"img","alt":" {ηr,i}r∈[m],i∈[n]","inline":true,"padRight":true},{"text":"are identically distributed Bernoullis (","element":"span"},{"style":{"fontStyle":"italic"},"text":"{","element":"span"},{"text":"0","element":"span"},{"style":{"fontStyle":"italic"},"text":", ","element":"span"},{"text":"1","element":"span"},{"style":{"fontStyle":"italic"},"text":"} ","element":"span"},{"text":"random variables) with expectation ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s/m","element":"span"},{"text":".","element":"span"}],[{"style":{"fontStyle":"italic"},"text":"• ","element":"span"},{"text":"The ","element":"span"},{"style":{"height":20.16},"width":259.7,"height":50.4,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-19.png","element":"img","alt":" {ηr,i}r∈[m],i∈[n]","inline":true,"padRight":true},{"text":"are independent across columns but not independent within each column. For every column ","element":"span"},{"style":{"height":13.2},"width":163.92,"height":33,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-20.png","element":"img","alt":" 1 ≤ i ≤ n","inline":true},{"text":", it holds that ","element":"span"},{"style":{"height":17.61},"width":235.3,"height":44.02,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-21.png","element":"img","alt":"�mr=1 ηr,i = s","inline":true},{"text":". 
Moreover, the random variables are ","element":"span"},{"style":{"fontStyle":"italic"},"text":"negatively correlated","element":"span"},{"text":": ","element":"span"},{"text":"for every subset ","element":"span"},{"style":{"height":16},"width":136.92,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-22.png","element":"img","alt":" S ⊆ [m]","inline":true,"padRight":true},{"text":"and every column ","element":"span"},{"style":{"height":13.2},"width":163.92,"height":33,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-23.png","element":"img","alt":" 1 ≤ i ≤ n","inline":true},{"text":", it holds that ","element":"span"},{"style":{"height":19.29},"width":490.09,"height":48.23,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-24.png","element":"img","alt":" E��r∈S ηr,i�≤ �r∈S E[ηr,i]","inline":true},{"text":".","element":"span"}],[{"text":"A common special case is a ","element":"span"},{"style":{"fontWeight":"bold"},"text":"uniform sparse JL distribution","element":"span"},{"text":", generated as follows: for every ","element":"span"},{"style":{"height":13.2},"width":166,"height":33,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-25.png","element":"img","alt":" 1 ≤ i ≤ n","inline":true},{"text":", we ","element":"span"},{"style":{"fontStyle":"italic"},"text":"uniformly ","element":"span"},{"text":"choose exactly ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"of these variables in ","element":"span"},{"style":{"height":20.16},"width":179.74,"height":50.4,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-26.png","element":"img","alt":" {ηr,i}r∈[m]","inline":true,"padRight":true},{"text":"to be ","element":"span"},{"text":"1","element":"span"},{"text":". 
When ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"= 1","element":"span"},{"text":", every sparse JL distribution is a uniform sparse JL distribution, but for ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s > ","element":"span"},{"text":"1","element":"span"},{"text":", this is not the case.","element":"span"}],[{"text":"Another common special case is a ","element":"span"},{"style":{"fontWeight":"bold"},"text":"block sparse JL distribution","element":"span"},{"text":". This produces a different construction for ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s > ","element":"span"},{"text":"1","element":"span"},{"text":". In this distribution, each column ","element":"span"},{"style":{"height":13.2},"width":164,"height":33,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-27.png","element":"img","alt":" 1 ≤ i ≤ n","inline":true,"padRight":true},{"text":"is partitioned into ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"blocks of","element":"span"},{"style":{"height":19.21},"width":75.66,"height":48.02,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-28.png","element":"img","alt":"� ms�","inline":true},{"text":"consecutive rows. 
In each block in each column, the distribution of the variables ","element":"span"},{"style":{"height":16.79},"width":96.38,"height":41.97,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-29.png","element":"img","alt":" {ηr,i}","inline":true,"padRight":true},{"text":"is defined by uniformly choosing ","element":"span"},{"style":{"fontStyle":"italic"},"text":"exactly one ","element":"span"},{"text":"of these variables to be ","element":"span"},{"style":{"height":13.38},"width":46.99,"height":33.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-30.png","element":"img","alt":" 1.8","inline":true}],[{"id":"id-27","style":{"fontWeight":"bold"},"text":"1.2 ","element":"span"},{"style":{"fontWeight":"bold"},"text":"Proof Techniques","element":"span"}],[{"text":"We use the following notation. For any random variable ","element":"span"},{"style":{"fontStyle":"italic"},"text":"X ","element":"span"},{"text":"and value ","element":"span"},{"style":{"height":14},"width":96.1,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-31.png","element":"img","alt":" q ≥ 1","inline":true},{"text":", we call ","element":"span"},{"style":{"height":16},"width":124.52,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-32.png","element":"img","alt":" E[|X|q]","inline":true,"padRight":true},{"text":"the ","element":"span"},{"style":{"fontStyle":"italic"},"text":"q","element":"span"},{"text":"th ","element":"span"},{"style":{"fontStyle":"italic"},"text":"moment ","element":"span"},{"text":"of ","element":"span"},{"style":{"fontStyle":"italic"},"text":"X","element":"span"},{"text":", where ","element":"span"},{"text":"E ","element":"span"},{"text":"denotes the expectation. 
We use ","element":"span"},{"style":{"height":19.18},"width":90.99,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-33.png","element":"img","alt":" ∥X∥q","inline":true,"padRight":true},{"text":"to denote the ","element":"span"},{"style":{"fontStyle":"italic"},"text":"q","element":"span"},{"text":"-norm ","element":"span"},{"style":{"height":20.41},"width":202.79,"height":51.03,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-34.png","element":"img","alt":" (E[|X|q])1/q","inline":true},{"text":".","element":"span"}],[{"text":"For every ","element":"span"},{"style":{"height":16},"width":293.3,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-35.png","element":"img","alt":" [x1, . . . , xn] ∈ Rn","inline":true,"padRight":true},{"text":"such that ","element":"span"},{"style":{"height":16.78},"width":153.66,"height":41.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-36.png","element":"img","alt":" ∥x∥2 = 1","inline":true},{"text":", we need to analyze tail bounds of an error term, which for the sparse JL construction is the following random variable:","element":"span"}],[{"style":{"width":"53%"},"width":1014,"height":116,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-37.png","element":"img"}],[{"text":"An upper bound on the tail probability of ","element":"span"},{"style":{"height":16},"width":235.74,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-38.png","element":"img","alt":" R(x1, . . . 
, xn)","inline":true,"padRight":true},{"text":"is needed to prove the lower bound on ","element":"span"},{"style":{"height":16},"width":192.23,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-39.png","element":"img","alt":" v(m, ϵ, δ, s)","inline":true,"padRight":true},{"text":"in Theorem ","element":"span"},{"href":"#id-25","text":"1.5, ","element":"a"},{"text":"and a lower bound is needed to prove the upper bound on ","element":"span"},{"style":{"height":16},"width":192.23,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-40.png","element":"img","alt":" v(m, ϵ, δ, s)","inline":true,"padRight":true},{"text":"in Theorem ","element":"span"},{"href":"#id-25","text":"1.5. ","element":"a"},{"text":"It turns out that it suffices to tightly analyze the random variable moments ","element":"span"},{"style":{"height":16},"width":332.47,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/3-41.png","element":"img","alt":" E[(R(x1, . . . , xn))q]","inline":true},{"text":". For the upper bound, we use Markov’s inequality like in ","element":"span"},{"href":"#id-18","referenceIndex":13,"text":"[13, ","element":"a"},{"href":"#id-10","referenceIndex":19,"text":"19, ","element":"a"},{"href":"#id-28","referenceIndex":3,"text":"3, ","element":"a"},{"href":"#id-29","referenceIndex":24,"text":"24]","element":"a"},{"text":", and for the lower bound, we use the Paley-Zygmund inequality like in ","element":"span"},{"href":"#id-18","referenceIndex":13,"text":"[13]","element":"a"},{"text":": Markov’s inequality gives a tail upper bound from upper bounds on moments, and the Paley-Zygmund inequality gives a tail lower bound from upper and lower bounds on moments. 
Thus, the key ingredient of our analysis is a ","element":"span"},{"style":{"fontStyle":"italic"},"text":"tight bound ","element":"span"},{"text":"for ","element":"span"},{"style":{"height":19.18},"width":290.08,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/4-0.png","element":"img","alt":" ∥R(x1, . . . , xn)∥q","inline":true,"padRight":true},{"text":"on ","element":"span"},{"style":{"height":29.2},"width":602.74,"height":73,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/4-1.png","element":"img","alt":" Sv =�x ∈ Rn | ∥x∥∞∥x∥2 ≤ v�at each","inline":true,"padRight":true},{"text":"threshold ","element":"span"},{"style":{"fontStyle":"italic"},"text":"v ","element":"span"},{"text":"value.","element":"span"}],[{"text":"While the moments of ","element":"span"},{"style":{"height":16},"width":235.74,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/4-2.png","element":"img","alt":" R(x1, . . . , xn)","inline":true,"padRight":true},{"text":"have been studied in previous analyses of sparse JL, we emphasize that it is not clear how to adapt these existing approaches to obtain a tight bound on every ","element":"span"},{"style":{"height":13.19},"width":40.44,"height":32.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/4-3.png","element":"img","alt":" Sv","inline":true},{"text":". 
The moment bound that we require and obtain is far more general: the bounds in ","element":"span"},{"href":"#id-10","referenceIndex":19,"text":"[19, ","element":"a"},{"href":"#id-30","referenceIndex":9,"text":"9] ","element":"a"},{"text":"are limited to ","element":"span"},{"style":{"height":13.19},"width":149.52,"height":32.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/4-4.png","element":"img","alt":" Rn = S1","inline":true,"padRight":true},{"text":"and the bound in ","element":"span"},{"href":"#id-18","referenceIndex":13,"text":"[13] ","element":"a"},{"text":"is limited to ","element":"span"},{"style":{"height":13.38},"width":124.78,"height":33.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/4-5.png","element":"img","alt":" s = 1.9","inline":true,"padRight":true},{"text":"The non-combinatorial approach in ","element":"span"},{"href":"#id-30","referenceIndex":9,"text":"[9] ","element":"a"},{"text":"for bounding ","element":"span"},{"style":{"height":19.18},"width":290.09,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/4-6.png","element":"img","alt":" ∥R(x1, . . . 
, xn)∥q","inline":true,"padRight":true},{"text":"on ","element":"span"},{"style":{"height":13.19},"width":144.04,"height":32.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/4-7.png","element":"img","alt":"Rn = S1","inline":true,"padRight":true},{"text":"also turns out to not be sufficiently precise on ","element":"span"},{"style":{"height":13.19},"width":40.44,"height":32.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/4-8.png","element":"img","alt":" Sv","inline":true},{"text":", for reasons we discuss in Section ","element":"span"},{"text":"2.","element":"span"},{"style":{"height":7.6},"width":31.87,"height":19,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/4-9.png","element":"img","alt":"10","inline":true}],[{"text":"Thus, we require new tools for our moment bound. Our analysis provides a new perspective, inspired by the probability theory literature, that differs from the existing approaches in the JL literature. We believe our style of analysis is less brittle than combinatorial approaches ","element":"span"},{"href":"#id-18","referenceIndex":13,"text":"[13, ","element":"a"},{"href":"#id-10","referenceIndex":19,"text":"19, ","element":"a"},{"href":"#id-28","referenceIndex":3,"text":"3, ","element":"a"},{"href":"#id-29","referenceIndex":24,"text":"24]","element":"a"},{"text":": in this setting, once the sparsity ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"= 1 ","element":"span"},{"text":"case is recovered, it becomes straightforward to generalize to other ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"values. 
Moreover, our approach can yield greater precision than the existing non-combinatorial approaches ","element":"span"},{"href":"#id-30","referenceIndex":9,"text":"[9, ","element":"a"},{"href":"#id-15","referenceIndex":8,"text":"8, ","element":"a"},{"href":"#id-31","referenceIndex":14,"text":"14]","element":"a"},{"text":", which is necessary for this setting. Thus, we believe that our ","element":"span"},{"style":{"fontStyle":"italic"},"text":"structural ","element":"span"},{"text":"approach to analyzing JL distributions could be of use in other settings.","element":"span"}],[{"text":"In Section ","element":"span"},{"text":"2, ","element":"span"},{"text":"we present an overview of our methods and the key technical lemmas to analyze ","element":"span"},{"style":{"height":19.18},"width":290.09,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/4-10.png","element":"img","alt":" ∥R(x1, . . . , xn)∥q","inline":true},{"text":". We defer the proofs to the Appendix. In Section ","element":"span"},{"text":"3, ","element":"span"},{"text":"we prove the tail bounds in Theorem ","element":"span"},{"text":"1","element":"span"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"href":"#id-25","text":"5 ","element":"a"},{"text":"from these moment bounds. In Section ","element":"span"},{"text":"4, ","element":"span"},{"text":"we empirically evaluate sparse JL.","element":"span"}]]},{"heading":"2 Sketch of Bounding the Moments of R(x1, . . . , xn)","paragraphs":[[{"text":"Our approach takes advantage of the structure of ","element":"span"},{"style":{"height":16},"width":235.74,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/4-11.png","element":"img","alt":" R(x1, . . . , xn)","inline":true,"padRight":true},{"text":"as a quadratic form of Rademachers (i.e. 
","element":"span"},{"style":{"height":19.14},"width":304.22,"height":47.84,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/4-12.png","element":"img","alt":"∑t1,t2 at1,t2σt1σt2","inline":true},{"text":") with random variable coefficients (i.e. where ","element":"span"},{"style":{"height":11.59},"width":84.16,"height":28.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/4-13.png","element":"img","alt":" at1,t2","inline":true,"padRight":true},{"text":"is itself a random variable). For the ","element":"span"},{"text":"upper bound, we need to analyze ","element":"span"},{"style":{"height":19.18},"width":290.09,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/4-14.png","element":"img","alt":" ∥R(x1, . . . , xn)∥q","inline":true,"padRight":true},{"text":"for general vectors ","element":"span"},{"style":{"height":16},"width":195.75,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/4-15.png","element":"img","alt":" [x1, . . . , xn]","inline":true},{"text":". For the lower bound, we only need to show ","element":"span"},{"style":{"height":19.18},"width":290.09,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/4-16.png","element":"img","alt":" ∥R(x1, . . . 
, xn)∥q","inline":true,"padRight":true},{"text":"is large for a single vector in each ","element":"span"},{"style":{"height":13.19},"width":40.44,"height":32.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/4-17.png","element":"img","alt":" Sv","inline":true},{"text":", and we show we can select the vector in the ","element":"span"},{"style":{"height":7.6},"width":32.6,"height":19,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/4-18.png","element":"img","alt":" ℓ2","inline":true},{"text":"-unit ball with ","element":"span"},{"style":{"height":17.39},"width":76.6,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/4-19.png","element":"img","alt":" 1/v2","inline":true,"padRight":true},{"text":"nonzero entries, all equal to ","element":"span"},{"style":{"fontStyle":"italic"},"text":"v","element":"span"},{"text":". For ease of notation, we denote this vector by ","element":"span"},{"text":"[","element":"span"},{"style":{"fontStyle":"italic"},"text":"v, . . . , v, ","element":"span"},{"text":"0","element":"span"},{"style":{"fontStyle":"italic"},"text":", . . . , ","element":"span"},{"text":"0] ","element":"span"},{"text":"for the remainder of the paper.","element":"span"}],[{"text":"We analyze ","element":"span"},{"style":{"height":19.18},"width":290.09,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/4-20.png","element":"img","alt":" ∥R(x1, . . . , xn)∥q","inline":true,"padRight":true},{"text":"using general moment bounds for Rademacher linear and quadratic forms. Though Cohen, Jayram, and Nelson ","element":"span"},{"href":"#id-30","referenceIndex":9,"text":"[9] ","element":"a"},{"text":"also view ","element":"span"},{"style":{"height":16},"width":235.74,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/4-21.png","element":"img","alt":" R(x1, . . . 
, xn)","inline":true,"padRight":true},{"text":"as a quadratic form, we show in Appendix ","element":"span"},{"text":"B ","element":"span"},{"text":"that their approach of bounding the Rademachers by gaussians is not sufficiently precise for our setting.","element":"span"},{"style":{"height":7.6},"width":31.87,"height":19,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/4-22.png","element":"img","alt":"11","inline":true}],[{"text":"In our approach, we make use of stronger moment bounds for Rademacher linear and quadratic forms, some of which are known to the probability theory community through Latała’s work in ","element":"span"},{"href":"#id-32","referenceIndex":21,"text":"[21, ","element":"a"},{"href":"#id-33","referenceIndex":20,"text":"20] ","element":"a"},{"text":"and some of which are new adaptions tailored to the constraints arising in our setting. More specifically, Latała’s bounds ","element":"span"},{"href":"#id-32","referenceIndex":21,"text":"[21, ","element":"a"},{"href":"#id-33","referenceIndex":20,"text":"20] ","element":"a"},{"text":"target the setting where the coefficients are scalars. In our setting, however, the coefficients are themselves random variables, and we need bounds that are ","element":"span"},{"style":{"fontStyle":"italic"},"text":"tractable ","element":"span"},{"text":"to analyze in this setting, which involves creating new bounds to handle some cases.","element":"span"}],[{"text":"Our strategy for bounding ","element":"span"},{"style":{"height":19.18},"width":290.09,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/4-23.png","element":"img","alt":" ∥R(x1, . . . , xn)∥q","inline":true,"padRight":true},{"text":"is to break down into rows. 
We define","element":"span"}],[{"style":{"width":"40%"},"width":765,"height":93,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/4-24.png","element":"img"}],[{"text":"so that ","element":"span"},{"style":{"height":19.37},"width":677.19,"height":48.43,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/4-25.png","element":"img","alt":" R(x1, . . . , xn) = (1/s) ∑_{r=1}^{m} Zr(x1, . . . , xn)","inline":true},{"text":". We analyze the moments of ","element":"span"},{"style":{"height":16},"width":250.02,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/4-26.png","element":"img","alt":" Zr(x1, . . . , xn)","inline":true},{"text":", and then combine ","element":"span"},{"text":"these bounds to obtain moment bounds for ","element":"span"},{"style":{"height":16},"width":235.74,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/4-27.png","element":"img","alt":" R(x1, . . . , xn)","inline":true},{"text":". In our bounds, we use the notation ","element":"span"},{"style":{"height":15.2},"width":103.27,"height":38,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/4-28.png","element":"img","alt":" f ≲ g","inline":true,"padRight":true},{"text":"(resp. ","element":"span"},{"style":{"height":15.2},"width":95.94,"height":38,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/4-29.png","element":"img","alt":"f ≳ g","inline":true},{"text":") to denote ","element":"span"},{"style":{"height":14},"width":127.3,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/4-30.png","element":"img","alt":" f ≤ Cg","inline":true,"padRight":true},{"text":"(resp. 
","element":"span"},{"style":{"height":14},"width":127.3,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/4-31.png","element":"img","alt":" f ≥ Cg","inline":true},{"text":") for some constant ","element":"span"},{"style":{"fontStyle":"italic"},"text":"C > ","element":"span"},{"text":"0","element":"span"},{"text":".","element":"span"}],[{"style":{"fontWeight":"bold"},"text":"2.1 ","element":"span"},{"style":{"fontWeight":"bold"},"text":"Bounding ","element":"span"},{"style":{"fontStyle":"italic"},"text":"∥","element":"span"},{"style":{"fontStyle":"italic"},"text":"Z","element":"span"},{"style":{"fontStyle":"italic"},"text":"r","element":"span"},{"text":"(","element":"span"},{"style":{"fontStyle":"italic"},"text":"x","element":"span"},{"text":"1","element":"span"},{"style":{"fontStyle":"italic"},"text":", . . . , x","element":"span"},{"style":{"fontStyle":"italic"},"text":"n","element":"span"},{"text":")","element":"span"},{"style":{"fontStyle":"italic"},"text":"∥","element":"span"},{"style":{"fontStyle":"italic"},"text":"q","element":"span"}],[{"text":"We show the following bounds on ","element":"span"},{"style":{"height":19.18},"width":304.37,"height":47.95,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-0.png","element":"img","alt":" ∥Zr(x1, . . . , xn)∥q","inline":true},{"text":". For the lower bound, as we discussed before, it suffices to bound ","element":"span"},{"style":{"height":19.18},"width":406.86,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-1.png","element":"img","alt":" ∥Zr(v, . . . , v, 0, . . . , 0)∥q","inline":true},{"text":". For the upper bound, we need to bound ","element":"span"},{"style":{"height":19.18},"width":304.37,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-2.png","element":"img","alt":" ∥Zr(x1, . . . 
, xn)∥q","inline":true,"padRight":true},{"text":"for general vectors as a function of the ","element":"span"},{"style":{"height":5.2},"width":48.6,"height":13,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-3.png","element":"img","alt":" ℓ∞","inline":true},{"text":"-to-","element":"span"},{"style":{"height":7.6},"width":32.6,"height":19,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-4.png","element":"img","alt":"ℓ2","inline":true,"padRight":true},{"text":"norm ratio.","element":"span"}],[{"id":"id-34","style":{"fontWeight":"bold"},"text":"Lemma 2.1 ","element":"span"},{"text":"Let ","element":"span"},{"style":{"height":16.39},"width":114.05,"height":40.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-5.png","element":"img","alt":" As,m,n","inline":true,"padRight":true},{"text":"be a sparse JL distribution such that ","element":"span"},{"style":{"height":16},"width":145.73,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-6.png","element":"img","alt":" s ≤ m/e","inline":true},{"text":". Suppose that ","element":"span"},{"style":{"height":16},"width":271.66,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-7.png","element":"img","alt":" x = [x1, . . . , xn]","inline":true,"padRight":true},{"text":"satisfies ","element":"span"},{"style":{"height":16.78},"width":168.52,"height":41.95,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-8.png","element":"img","alt":"∥x∥∞ ≤ v","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":16.78},"width":153.66,"height":41.95,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-9.png","element":"img","alt":" ∥x∥2 = 1","inline":true},{"text":". 
If ","element":"span"},{"style":{"fontStyle":"italic"},"text":"T ","element":"span"},{"text":"is even, then:","element":"span"}],[{"style":{"width":"80%"},"width":1533,"height":192,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-10.png","element":"img"}],[{"id":"id-35","style":{"fontWeight":"bold"},"text":"Lemma 2.2 ","element":"span"},{"text":"Let ","element":"span"},{"style":{"height":16.39},"width":114.06,"height":40.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-11.png","element":"img","alt":" As,m,n","inline":true,"padRight":true},{"text":"be a sparse JL distribution. Suppose ","element":"span"},{"style":{"height":19.37},"width":30.94,"height":48.43,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-12.png","element":"img","alt":"1v2","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"fontStyle":"italic"},"text":"T ","element":"span"},{"text":"are even integers. ","element":"span"},{"text":"Then, ","element":"span"},{"style":{"height":17.5},"width":495.66,"height":43.74,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-13.png","element":"img","alt":" ∥Zr(v, . . . , v, 0, . . . , 0)∥2 ≳ sm","inline":true},{"text":". 
Moreover, if ","element":"span"},{"style":{"height":16},"width":145.73,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-14.png","element":"img","alt":" s ≤ m/e","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":16.57},"width":145.96,"height":41.43,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-15.png","element":"img","alt":" T ≥ semv2","inline":true,"padRight":true},{"text":", then","element":"span"}],[{"style":{"width":"49%"},"width":941,"height":88,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-16.png","element":"img"}],[{"text":"and","element":"span"}],[{"style":{"width":"75%"},"width":1446,"height":130,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-17.png","element":"img"}],[{"text":"We now sketch our methods to prove Lemma ","element":"span"},{"href":"#id-34","text":"2.1 ","element":"a"},{"text":"and Lemma ","element":"span"},{"href":"#id-35","text":"2.2. ","element":"a"},{"text":"For the lower bound (Lemma ","element":"span"},{"href":"#id-35","text":"2.2)","element":"a"},{"text":", we can view ","element":"span"},{"style":{"height":16},"width":352.52,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-18.png","element":"img","alt":" Zr(v, . . . , v, 0, . . . 
, 0)","inline":true,"padRight":true},{"text":"as a quadratic form ","element":"span"},{"style":{"height":19.14},"width":304.22,"height":47.84,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-19.png","element":"img","alt":"∑t1,t2 at1,t2σt1σt2","inline":true,"padRight":true},{"text":"where ","element":"span"},{"style":{"height":17.68},"width":270.82,"height":44.2,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-20.png","element":"img","alt":" (at1,t2)t1,t2∈[mn]","inline":true,"padRight":true},{"text":"is an ","element":"span"},{"text":"appropriately defined block-diagonal ","element":"span"},{"style":{"fontStyle":"italic"},"text":"mn ","element":"span"},{"text":"dimensional matrix. ","element":"span"},{"text":"We can write ","element":"span"},{"style":{"height":16.79},"width":495.86,"height":41.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-21.png","element":"img","alt":" Eσ,η[(Zr(v, . . . , v, 0, . . . , 0))q]","inline":true,"padRight":true},{"text":"as ","element":"span"},{"style":{"height":16.79},"width":545.47,"height":41.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-22.png","element":"img","alt":"Eη [Eσ[(Zr(v, . . . , v, 0, . . . , 0))q]]","inline":true},{"text":": for ","element":"span"},{"style":{"height":15.99},"width":153.67,"height":39.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-23.png","element":"img","alt":" fixed ηr,i","inline":true,"padRight":true},{"text":"values, the coefficients are scalars. We make use of Latała’s tight bound on Rademacher quadratic forms with scalar coefficients ","element":"span"},{"href":"#id-32","referenceIndex":21,"text":"[21] ","element":"a"},{"text":"to analyze ","element":"span"},{"style":{"height":16},"width":470.7,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-24.png","element":"img","alt":" Eσ[(Zr(v, . . . , v, 0, . . . 
, 0))q]","inline":true,"padRight":true},{"text":"as a function of the ","element":"span"},{"style":{"height":11.59},"width":54.17,"height":28.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-25.png","element":"img","alt":" ηr,i","inline":true},{"text":". Then, we handle the randomness of the ","element":"span"},{"style":{"height":11.59},"width":54.16,"height":28.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-26.png","element":"img","alt":" ηr,i","inline":true,"padRight":true},{"text":"by taking an expectation of the resulting bound on ","element":"span"},{"style":{"height":16},"width":470.7,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-27.png","element":"img","alt":" Eσ[(Zr(v, . . . , v, 0, . . . , 0))q]","inline":true,"padRight":true},{"text":"over the ","element":"span"},{"style":{"height":11.59},"width":54.16,"height":28.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-28.png","element":"img","alt":" ηr,i","inline":true,"padRight":true},{"text":"values to obtain a bound on ","element":"span"},{"style":{"height":19.18},"width":406.86,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-29.png","element":"img","alt":" ∥Zr(v, . . . , v, 0, . . . , 0)∥q","inline":true},{"text":".","element":"span"}],[{"text":"For the upper bound (Lemma ","element":"span"},{"href":"#id-34","text":"2.1)","element":"a"},{"text":", since Latała’s bound ","element":"span"},{"href":"#id-32","referenceIndex":21,"text":"[21] ","element":"a"},{"text":"is tight for scalar quadratic forms, the natural approach would be to use it to upper bound ","element":"span"},{"style":{"height":16},"width":368.21,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-30.png","element":"img","alt":" Eσ[(Zr(x1, . . . , xn))q]","inline":true,"padRight":true},{"text":"for general vectors. 
However, when the vector is not of the form ","element":"span"},{"text":"[","element":"span"},{"style":{"fontStyle":"italic"},"text":"v, . . . , v, ","element":"span"},{"text":"0","element":"span"},{"style":{"fontStyle":"italic"},"text":", . . . , ","element":"span"},{"text":"0]","element":"span"},{"text":", the asymmetry makes the resulting bound intractable to simplify. Specifically, there is a term, which can be viewed as a generalization of an operator norm to an ","element":"span"},{"style":{"height":7.6},"width":32.6,"height":19,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-31.png","element":"img","alt":" ℓ2","inline":true,"padRight":true},{"text":"ball cut out by ","element":"span"},{"style":{"height":5.2},"width":48.6,"height":13,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-32.png","element":"img","alt":" ℓ∞","inline":true,"padRight":true},{"text":"hyperplanes, that becomes problematic when taking an expectation over the ","element":"span"},{"style":{"height":11.59},"width":54.16,"height":28.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-33.png","element":"img","alt":" ηr,i","inline":true,"padRight":true},{"text":"to obtain a bound on ","element":"span"},{"style":{"height":16.79},"width":393.38,"height":41.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-34.png","element":"img","alt":"Eσ,η[(Zr(x1, . . . , xn))q]","inline":true},{"text":". Thus, we construct simpler estimates that avoid these complications while remaining sufficiently precise for our setting. These estimates take advantage of the structure of ","element":"span"},{"style":{"height":16},"width":250.02,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-35.png","element":"img","alt":" Zr(x1, . . . 
, xn)","inline":true,"padRight":true},{"text":"and enable us to show Lemma ","element":"span"},{"href":"#id-34","text":"2.1.","element":"a"}],[{"style":{"fontWeight":"bold"},"text":"2.2 ","element":"span"},{"style":{"fontWeight":"bold"},"text":"Obtaining bounds on ","element":"span"},{"style":{"fontStyle":"italic"},"text":"∥","element":"span"},{"style":{"fontStyle":"italic"},"text":"R","element":"span"},{"text":"(","element":"span"},{"style":{"fontStyle":"italic"},"text":"x","element":"span"},{"text":"1","element":"span"},{"style":{"fontStyle":"italic"},"text":", . . . , x","element":"span"},{"style":{"fontStyle":"italic"},"text":"n","element":"span"},{"text":")","element":"span"},{"style":{"fontStyle":"italic"},"text":"∥","element":"span"},{"style":{"fontStyle":"italic"},"text":"q","element":"span"}],[{"text":"Now, we use Lemma ","element":"span"},{"href":"#id-34","text":"2.1 ","element":"a"},{"text":"and Lemma ","element":"span"},{"href":"#id-35","text":"2.2 ","element":"a"},{"text":"to show the following bounds on ","element":"span"},{"style":{"height":19.18},"width":290.09,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-36.png","element":"img","alt":" ∥R(x1, . . . 
, xn)∥q","inline":true},{"text":":","element":"span"}],[{"id":"id-36","style":{"fontWeight":"bold"},"text":"Lemma 2.3 ","element":"span"},{"text":"Suppose ","element":"span"},{"style":{"height":16.39},"width":114.06,"height":40.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-37.png","element":"img","alt":" As,m,n","inline":true,"padRight":true},{"text":"is a sparse JL distribution such that ","element":"span"},{"style":{"height":16},"width":163.15,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-38.png","element":"img","alt":" s ≤ m/e","inline":true},{"text":", and let ","element":"span"},{"style":{"height":16},"width":289.08,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-39.png","element":"img","alt":" x = [x1, . . . , xn]","inline":true,"padRight":true},{"text":"be such that ","element":"span"},{"style":{"height":16.78},"width":162.93,"height":41.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-40.png","element":"img","alt":" ∥x∥2 = 1","inline":true},{"text":". Then, ","element":"span"},{"style":{"height":16.78},"width":339.69,"height":41.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-41.png","element":"img","alt":" ∥R(x1, . . . , xn)∥2 ≤","inline":true}],[{"style":{"height":16.78},"width":173.5,"height":41.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-42.png","element":"img","alt":"∥x∥∞ ≤ v","inline":true},{"text":". If ","element":"span"},{"style":{"height":16.57},"width":142.66,"height":41.43,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-43.png","element":"img","alt":"semv2 ≥ q","inline":true},{"text":", then ","element":"span"},{"style":{"height":25.21},"width":409.76,"height":63.03,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-44.png","element":"img","alt":" ∥R(x1, . . . , xn)∥q ≲ √q√m","inline":true},{"text":". 
If ","element":"span"},{"style":{"height":16.57},"width":142.66,"height":41.43,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-45.png","element":"img","alt":"semv2 < q","inline":true,"padRight":true},{"text":"and if there exists a constant ","element":"span"},{"style":{"height":13.2},"width":124.47,"height":33,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-46.png","element":"img","alt":" C2 ≥ 1","inline":true,"padRight":true},{"text":"such ","element":"span"},{"text":"that ","element":"span"},{"style":{"height":16.59},"width":244.88,"height":41.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-47.png","element":"img","alt":" C2q3mv4 ≥ s2","inline":true},{"text":", then ","element":"span"},{"style":{"height":19.18},"width":364.82,"height":47.95,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-48.png","element":"img","alt":" ∥R(x1, . . . , xn)∥q ≲ g","inline":true,"padRight":true},{"text":"where ","element":"span"},{"style":{"fontStyle":"italic"},"text":"g ","element":"span"},{"text":"is:","element":"span"}],[{"id":"id-37","style":{"width":"74%"},"width":1434,"height":294,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/5-49.png","element":"img"}],[{"style":{"fontWeight":"bold"},"text":"Lemma 2.4 ","element":"span"},{"text":"Suppose ","element":"span"},{"style":{"height":16.39},"width":114.05,"height":40.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-0.png","element":"img","alt":" As,m,n","inline":true,"padRight":true},{"text":"is a uniform sparse JL distribution. 
Let ","element":"span"},{"style":{"fontStyle":"italic"},"text":"q ","element":"span"},{"text":"be a power of ","element":"span"},{"text":"2","element":"span"},{"text":", and suppose that ","element":"span"},{"style":{"height":13.6},"width":230.63,"height":34,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-1.png","element":"img","alt":"0 < v ≤ 0.5","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":19.37},"width":30.94,"height":48.43,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-2.png","element":"img","alt":"1v2","inline":true,"padRight":true},{"text":"is an even integer. ","element":"span"},{"text":"If ","element":"span"},{"style":{"height":16.59},"width":146.32,"height":41.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-3.png","element":"img","alt":" qv2 ≤ s","inline":true},{"text":", then ","element":"span"},{"style":{"height":25.21},"width":523.62,"height":63.03,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-4.png","element":"img","alt":" ∥R(v, . . . , v, 0, . . . , 0)∥q ≳ √q√m","inline":true},{"text":". 
","element":"span"},{"text":"If ","element":"span"},{"style":{"height":14},"width":224.34,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-5.png","element":"img","alt":" m ≥ q, 2 ≤","inline":true},{"style":{"height":17.39},"width":771.08,"height":43.47,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-6.png","element":"img","alt":"ln(qmv4/s2) ≤ q, 2qv2 ≤ 0.5s ln(qmv4/s2)","inline":true},{"text":", and ","element":"span"},{"style":{"height":16},"width":162.44,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-7.png","element":"img","alt":" s ≤ m/e","inline":true},{"text":", then ","element":"span"},{"style":{"height":25.82},"width":664.67,"height":64.54,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-8.png","element":"img","alt":" ∥R(v, . . . , v, 0, . . . , 0)∥q ≳ qv2s ln(qmv4/s2)","inline":true},{"text":". ","element":"span"},{"text":"If","element":"span"}],[{"style":{"width":"83%"},"width":1604,"height":70,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-9.png","element":"img"}],[{"text":"We now sketch how to prove bounds on ","element":"span"},{"style":{"height":19.18},"width":290.08,"height":47.95,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-10.png","element":"img","alt":" ∥R(x1, . . . , xn)∥q","inline":true,"padRight":true},{"text":"using bounds on ","element":"span"},{"style":{"height":16.78},"width":312.37,"height":41.95,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-11.png","element":"img","alt":" ∥Zr(x1, . . . , xn)∥T","inline":true,"padRight":true},{"text":". To show Lemma ","element":"span"},{"href":"#id-36","text":"2.3, ","element":"a"},{"text":"we show that making the row terms ","element":"span"},{"style":{"height":16},"width":250.02,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-12.png","element":"img","alt":" Zr(x1, . . . 
, xn)","inline":true,"padRight":true},{"text":"independent does not decrease ","element":"span"},{"style":{"height":19.18},"width":290.09,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-13.png","element":"img","alt":" ∥R(x1, . . . , xn)∥q","inline":true},{"text":", and then we apply a general result from ","element":"span"},{"href":"#id-33","referenceIndex":20,"text":"[20] ","element":"a"},{"text":"for moments of sums of i.i.d symmetric random variables. For Lemma ","element":"span"},{"href":"#id-37","text":"2.4, ","element":"a"},{"text":"handling the correlations between the row terms ","element":"span"},{"style":{"height":16},"width":250.02,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-14.png","element":"img","alt":" Zr(x1, . . . , xn)","inline":true,"padRight":true},{"text":"requires more care. We show that the negative correlations induced by having exactly ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"nonzero entries per column do not lead to significant loss, and then stitch together ","element":"span"},{"style":{"height":19.18},"width":392.58,"height":47.95,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-15.png","element":"img","alt":" ∥R(v, . . . , v, 0, . . . , 0)∥q","inline":true,"padRight":true},{"text":"using the moments of ","element":"span"},{"style":{"height":16},"width":352.52,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-16.png","element":"img","alt":" Zr(v, . . . , v, 0, . . . 
, 0)","inline":true,"padRight":true},{"text":"that contribute the most.","element":"span"}]]},{"heading":"3 Proof of Main Result from Moment Bounds","paragraphs":[[{"text":"We now sketch how to prove Theorem ","element":"span"},{"href":"#id-25","text":"1.5, ","element":"a"},{"text":"using Lemma ","element":"span"},{"href":"#id-36","text":"2.3 ","element":"a"},{"text":"and Lemma ","element":"span"},{"href":"#id-37","text":"2.4. ","element":"a"},{"text":"First, we simplify these bounds at the target parameters to obtain the following:","element":"span"}],[{"id":"id-38","style":{"fontWeight":"bold"},"text":"Lemma 3.1 ","element":"span"},{"text":"Let ","element":"span"},{"style":{"height":16.39},"width":114.06,"height":40.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-17.png","element":"img","alt":" As,m,n","inline":true,"padRight":true},{"text":"be a sparse JL distribution, and suppose ","element":"span"},{"style":{"height":0},"width":20,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-18.png","element":"img","alt":" ϵ","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":11.6},"width":19,"height":29,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-19.png","element":"img","alt":" δ","inline":true,"padRight":true},{"text":"are small enough, ","element":"span"},{"style":{"height":16},"width":168.14,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-20.png","element":"img","alt":" s ≤ m/e","inline":true},{"text":", ","element":"span"},{"style":{"height":17.39},"width":990.04,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-21.png","element":"img","alt":"Θ(ϵ−2 ln(1/δ)) ≤ m < 2ϵ−2/δ, v ≤ f ′(m, ϵ, ln(1/δ), s)","inline":true},{"text":", and 
","element":"span"},{"style":{"height":16},"width":279.38,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-22.png","element":"img","alt":" p = Θ(ln(1/δ))","inline":true,"padRight":true},{"text":"is even. ","element":"span"},{"text":"If ","element":"span"},{"style":{"height":16},"width":292.08,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-23.png","element":"img","alt":" x = [x1, . . . , xn]","inline":true,"padRight":true},{"text":"satisfies ","element":"span"},{"style":{"height":16.78},"width":168.52,"height":41.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-24.png","element":"img","alt":" ∥x∥∞ ≤ v","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":16.78},"width":153.66,"height":41.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-25.png","element":"img","alt":" ∥x∥2 = 1","inline":true},{"text":", then ","element":"span"},{"style":{"height":19.18},"width":367.42,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-26.png","element":"img","alt":" ∥R(x1, . . . , xn)∥p ≤ ϵ2","inline":true},{"text":".","element":"span"}],[{"id":"id-39","style":{"fontWeight":"bold"},"text":"Lemma 3.2 ","element":"span"},{"text":"There is a universal constant ","element":"span"},{"style":{"fontStyle":"italic"},"text":"D ","element":"span"},{"text":"satisfying the following property. 
Let ","element":"span"},{"style":{"height":16.39},"width":114.05,"height":40.97,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-27.png","element":"img","alt":" As,m,n","inline":true,"padRight":true},{"text":"be a uniform sparse JL distribution, and suppose ","element":"span"},{"style":{"height":14.8},"width":52.92,"height":37,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-28.png","element":"img","alt":" ϵ, δ","inline":true,"padRight":true},{"text":"are small enough, ","element":"span"},{"style":{"height":16},"width":585.29,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-29.png","element":"img","alt":" s ≤ m/e, f ′(m, ϵ, ln(1/δ), s) ≤ 0.5","inline":true},{"text":", and ","element":"span"},{"style":{"fontStyle":"italic"},"text":"q ","element":"span"},{"text":"is an even integer such that ","element":"span"},{"style":{"height":16},"width":463.82,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-30.png","element":"img","alt":" q = min(m/2, Θ(ln(1/δ)))","inline":true},{"text":". For each ","element":"span"},{"style":{"height":14},"width":116.25,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-31.png","element":"img","alt":" ψ > 0","inline":true},{"text":", there exists ","element":"span"},{"style":{"height":16},"width":482.84,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-32.png","element":"img","alt":" v ≤ f ′(m, ϵ, ln(1/δ), s) + ψ","inline":true},{"text":", such that ","element":"span"},{"style":{"height":19.18},"width":488.24,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-33.png","element":"img","alt":"∥R(v, . . . , v, 0, . . . 
, 0)∥q ≥ 2ϵ","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":29.16},"width":371.78,"height":72.9,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-34.png","element":"img","alt":"∥R(v,...,v,0,...,0)∥q / ∥R(v,...,v,0,...,0)∥2q ≥ D","inline":true},{"text":".","element":"span"}],[{"text":"Now, we use Lemma ","element":"span"},{"href":"#id-38","text":"3.1 ","element":"a"},{"text":"and Lemma ","element":"span"},{"href":"#id-39","text":"3.2 ","element":"a"},{"text":"to prove Theorem ","element":"span"},{"href":"#id-25","text":"1.5.","element":"a"}],[{"style":{"fontStyle":"italic"},"text":"Proof of Theorem ","element":"span"},{"text":"1","element":"span"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"href":"#id-25","text":"5","element":"a"},{"style":{"fontStyle":"italic"},"text":". ","element":"span"},{"text":"Since the maps in ","element":"span"},{"style":{"height":16.39},"width":114.05,"height":40.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-35.png","element":"img","alt":" As,m,n","inline":true,"padRight":true},{"text":"are linear, it suffices to consider unit vectors ","element":"span"},{"style":{"fontStyle":"italic"},"text":"x","element":"span"},{"text":". First, we prove the lower bound on ","element":"span"},{"style":{"height":16},"width":192.23,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-36.png","element":"img","alt":" v(m, ϵ, δ, s)","inline":true},{"text":". To handle ","element":"span"},{"style":{"height":17.38},"width":208.46,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-37.png","element":"img","alt":" m ≥ 2ϵ−2/δ","inline":true},{"text":", we take ","element":"span"},{"style":{"fontStyle":"italic"},"text":"q ","element":"span"},{"text":"= 2 ","element":"span"},{"text":"in Lemma ","element":"span"},{"href":"#id-38","text":"3.1 ","element":"a"},{"text":"and apply Chebyshev’s inequality. 
Otherwise, we take ","element":"span"},{"style":{"height":16},"width":205.62,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-38.png","element":"img","alt":" p = ln(1/δ)","inline":true,"padRight":true},{"text":"(approximately) and apply Lemma ","element":"span"},{"href":"#id-38","text":"3.1 ","element":"a"},{"text":"and Markov’s inequality. We see that ","element":"span"},{"style":{"height":20.4},"width":323.54,"height":50.99,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-39.png","element":"img","alt":" P[| ∥Ax∥22 − 1| ≥ ϵ]","inline":true,"padRight":true},{"text":"can be expressed as:","element":"span"}],[{"style":{"width":"68%"},"width":1307,"height":39,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-40.png","element":"img"}],[{"text":"Thus, condition ","element":"span"},{"href":"#id-6","text":"(1) ","element":"a"},{"text":"is satisfied for ","element":"span"},{"style":{"height":13.19},"width":111.92,"height":32.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-41.png","element":"img","alt":" x ∈ Sv","inline":true,"padRight":true},{"text":"when ","element":"span"},{"style":{"height":16},"width":386.6,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-42.png","element":"img","alt":" v ≤ f ′(m, ϵ, ln(1/δ), s)","inline":true,"padRight":true},{"text":"as desired.","element":"span"}],[{"text":"Now, we prove the upper bound on ","element":"span"},{"style":{"height":16},"width":192.23,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-43.png","element":"img","alt":" v(m, ϵ, δ, s)","inline":true},{"text":". We need to lower bound the tail probability of ","element":"span"},{"style":{"fontStyle":"italic"},"text":"R","element":"span"},{"text":"(","element":"span"},{"style":{"fontStyle":"italic"},"text":"v, . . . 
, v, ","element":"span"},{"text":"0","element":"span"},{"style":{"fontStyle":"italic"},"text":", . . . , ","element":"span"},{"text":"0)","element":"span"},{"text":", and to do this, we use the Paley-Zygmund inequality applied to ","element":"span"},{"style":{"fontStyle":"italic"},"text":"q","element":"span"},{"text":"th moments. Let ","element":"span"},{"style":{"fontStyle":"italic"},"text":"D ","element":"span"},{"text":"be defined as in Lemma ","element":"span"},{"href":"#id-39","text":"3.2, ","element":"a"},{"text":"and take ","element":"span"},{"style":{"height":24.43},"width":564.46,"height":61.07,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-44.png","element":"img","alt":" q = min(m/2, max(2, ln(1/δ)−2−2 ln(D) ))","inline":true},{"text":". By the Paley-Zygmund inequality and ","element":"span"},{"text":"Lemma ","element":"span"},{"href":"#id-39","text":"3.2, ","element":"a"},{"text":"there exists ","element":"span"},{"style":{"height":16},"width":460.81,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-45.png","element":"img","alt":" v ≤ f ′(m, ϵ, ln(1/δ), s) + ψ","inline":true,"padRight":true},{"text":"such that:","element":"span"}],[{"style":{"width":"74%"},"width":1432,"height":129,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-46.png","element":"img"}],[{"text":"Thus, it follows that ","element":"span"},{"style":{"height":24.44},"width":893.58,"height":61.1,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-47.png","element":"img","alt":" supx∈Sf′(m,ϵ,ln(1/δ),s)+ψ,∥x∥2=1 P[| ∥Ax∥22 − 1| > ϵ] > δ","inline":true,"padRight":true},{"text":"as desired.","element":"span"}]]},{"heading":"4 Empirical Evaluation","paragraphs":[[{"text":"Recall that for sparse JL distributions with sparsity ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s","element":"span"},{"text":", the projection time for an input vector 
","element":"span"},{"style":{"fontStyle":"italic"},"text":"x ","element":"span"},{"text":"is ","element":"span"},{"style":{"height":16.78},"width":168.82,"height":41.95,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-48.png","element":"img","alt":" O(s ∥x∥0)","inline":true},{"text":", where ","element":"span"},{"style":{"height":16.78},"width":78.63,"height":41.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-49.png","element":"img","alt":" ∥x∥0","inline":true,"padRight":true},{"text":"is the number of nonzero entries in ","element":"span"},{"style":{"fontStyle":"italic"},"text":"x","element":"span"},{"text":". Since this grows linearly in ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s","element":"span"},{"text":", in order to minimize the impact on projection time, we restrict to small constant ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"values (i.e. ","element":"span"},{"style":{"height":13.2},"width":198.04,"height":33,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/6-50.png","element":"img","alt":" 1 ≤ s ≤ 16","inline":true},{"text":"). In Section ","element":"span"},{"href":"#id-40","text":"4.1, ","element":"a"},{"text":"we demonstrate on real-world data the benefits of using ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s > ","element":"span"},{"text":"1","element":"span"},{"text":". In Section ","element":"span"},{"href":"#id-41","text":"4.2, ","element":"a"},{"text":"we illustrate trends in our theoretical bounds on synthetic data. Additional graphs can be found in Appendix ","element":"span"},{"text":"I. 
","element":"span"},{"text":"For all experiments, we use a block sparse JL distribution to demonstrate that our theoretical upper bounds also empirically generalize to non-uniform sparse JL distributions.","element":"span"}],[{"id":"id-40","style":{"fontWeight":"bold"},"text":"4.1 ","element":"span"},{"style":{"fontWeight":"bold"},"text":"Real-World Datasets","element":"span"}],[{"text":"We considered two bag-of-words datasets: the News20 dataset ","element":"span"},{"href":"#id-42","referenceIndex":1,"text":"[1] ","element":"a"},{"text":"(based on newsgroup documents), and the Enron email dataset ","element":"span"},{"href":"#id-43","referenceIndex":26,"text":"[26] ","element":"a"},{"text":"(based on e-mails from the senior management of Enron).","element":"span"},{"style":{"height":7.6},"width":31.88,"height":19,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/7-0.png","element":"img","alt":"12","inline":true,"padRight":true},{"text":"Both datasets were pre-processed with the standard ","element":"span"},{"style":{"fontFamily":"monospace"},"text":"tf-idf ","element":"span"},{"text":"preprocessing. In this experiment, we evaluated how well sparse JL preserves the ","element":"span"},{"style":{"height":7.6},"width":32.6,"height":19,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/7-1.png","element":"img","alt":" ℓ2","inline":true,"padRight":true},{"text":"norms of the vectors in the dataset. 
An interesting direction for future work would be to empirically evaluate how well sparse JL preserves other aspects of the geometry of real-world data sets, such as the ","element":"span"},{"style":{"height":7.6},"width":32.6,"height":19,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/7-2.png","element":"img","alt":" ℓ2","inline":true,"padRight":true},{"text":"distances between pairs of vectors.","element":"span"}],[{"text":"In our experiment, we estimated the failure probability ","element":"span"},{"style":{"height":19.01},"width":155.98,"height":47.52,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/7-3.png","element":"img","alt":"ˆδ(s, m, ϵ)","inline":true,"padRight":true},{"text":"for each dataset as follows. Let ","element":"span"},{"style":{"fontStyle":"italic"},"text":"D ","element":"span"},{"text":"be the number of vectors in the dataset, and let ","element":"span"},{"style":{"fontStyle":"italic"},"text":"n ","element":"span"},{"text":"be the dimension (","element":"span"},{"style":{"fontStyle":"italic"},"text":"n ","element":"span"},{"text":"= 101631","element":"span"},{"text":", ","element":"span"},{"style":{"fontStyle":"italic"},"text":"D ","element":"span"},{"text":"= 11314 ","element":"span"},{"text":"for News20; ","element":"span"},{"style":{"fontStyle":"italic"},"text":"n ","element":"span"},{"text":"= 28102","element":"span"},{"text":", ","element":"span"},{"style":{"fontStyle":"italic"},"text":"D ","element":"span"},{"text":"= 39861 ","element":"span"},{"text":"for Enron). We drew a matrix ","element":"span"},{"style":{"height":16.39},"width":225.26,"height":40.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/7-4.png","element":"img","alt":" M ∼ As,m,n","inline":true,"padRight":true},{"text":"from a block sparse JL distribution. 
Then, we computed ","element":"span"},{"style":{"height":26.01},"width":98.11,"height":65.03,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/7-5.png","element":"img","alt":"∥Mx∥2/∥x∥2","inline":true,"padRight":true},{"text":"for each vector ","element":"span"},{"style":{"fontStyle":"italic"},"text":"x ","element":"span"},{"text":"in the dataset, and used these values to compute an estimate ","element":"span"},{"style":{"height":29.62},"width":828.46,"height":74.05,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/7-6.png","element":"img","alt":"ˆδ(s, m, ϵ) = (number of vectors x such that ∥Mx∥2/∥x∥2 ∉ 1 ± ϵ)/D","inline":true,"padRight":true},{"text":". We ran 100 trials to produce 100 estimates ","element":"span"},{"style":{"height":19.01},"width":155.98,"height":47.52,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/7-7.png","element":"img","alt":"ˆδ(s, m, ϵ)","inline":true},{"text":".","element":"span"}],[{"id":"id-44","style":{"width":"88%"},"width":1696,"height":537,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/7-8.png","element":"img"}],[{"text":"Figure 1: News20: ","element":"figcaption","subtype":"caption"},{"style":{"height":19.01},"width":210.66,"height":47.52,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/7-9.png","element":"img","alt":"ˆδ(m, s, 0.07)","inline":true,"padRight":true},{"text":"vs. ","element":"figcaption","subtype":"caption"},{"style":{"fontStyle":"italic"},"text":"s","element":"figcaption","subtype":"caption"}],[{"text":"Figure 2: Enron: ","element":"figcaption","subtype":"caption"},{"style":{"height":19.01},"width":210.65,"height":47.52,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/7-10.png","element":"img","alt":"ˆδ(m, s, 0.07)","inline":true,"padRight":true},{"text":"vs. 
","element":"figcaption","subtype":"caption"},{"style":{"fontStyle":"italic"},"text":"s","element":"figcaption","subtype":"caption"}],[{"text":"Figure ","element":"span"},{"href":"#id-44","text":"1 ","element":"a"},{"text":"and Figure ","element":"span"},{"href":"#id-44","text":"2 ","element":"a"},{"text":"show the mean and error bars (3 standard errors of the mean) of ","element":"span"},{"style":{"height":19.01},"width":155.98,"height":47.52,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/7-11.png","element":"img","alt":"ˆδ(s, m, ϵ)","inline":true,"padRight":true},{"text":"at ","element":"span"},{"style":{"height":11.6},"width":140.23,"height":29,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/7-12.png","element":"img","alt":" ϵ = 0.07","inline":true},{"text":". We consider ","element":"span"},{"style":{"height":16},"width":297.71,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/7-13.png","element":"img","alt":" s ∈ {1, 2, 4, 8, 16}","inline":true},{"text":", and choose ","element":"span"},{"style":{"fontStyle":"italic"},"text":"m ","element":"span"},{"text":"values so that ","element":"span"},{"style":{"height":19.01},"width":404.76,"height":47.52,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/7-14.png","element":"img","alt":" 0.01 ≤ ˆδ(1, m, ϵ) ≤ 0.04","inline":true},{"text":".","element":"span"}],[{"text":"All of the plots show that ","element":"span"},{"style":{"height":16},"width":260.07,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/7-15.png","element":"img","alt":" s ∈ {2, 4, 8, 16}","inline":true,"padRight":true},{"text":"achieves a lower failure probability than ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"= 1","element":"span"},{"text":", with the differences most pronounced when ","element":"span"},{"style":{"fontStyle":"italic"},"text":"m ","element":"span"},{"text":"is larger. 
In fact, at ","element":"span"},{"style":{"fontStyle":"italic"},"text":"m ","element":"span"},{"text":"= 1000","element":"span"},{"text":", there is a ","element":"span"},{"style":{"fontStyle":"italic"},"text":"factor of four ","element":"span"},{"text":"decrease in ","element":"span"},{"style":{"height":11.6},"width":19,"height":29,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/7-16.png","element":"img","alt":" δ","inline":true,"padRight":true},{"text":"between ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"= 1 ","element":"span"},{"text":"and ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"= 4","element":"span"},{"text":", and a ","element":"span"},{"style":{"fontStyle":"italic"},"text":"factor of ten ","element":"span"},{"text":"decrease between ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"= 1 ","element":"span"},{"text":"and ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"= 8","element":"span"},{"style":{"fontStyle":"italic"},"text":", ","element":"span"},{"text":"16","element":"span"},{"text":". 
We note that in plots in the Appendix, there is a slight increase between ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"= 8 ","element":"span"},{"text":"and ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"= 16 ","element":"span"},{"text":"at some ","element":"span"},{"style":{"height":14.8},"width":103.62,"height":37,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/7-17.png","element":"img","alt":" ϵ, δ, m","inline":true,"padRight":true},{"text":"values (see Appendix ","element":"span"},{"text":"I ","element":"span"},{"text":"for a discussion of this non-monotonicity in ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s","element":"span"},{"text":"); however ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s > ","element":"span"},{"text":"1 ","element":"span"},{"text":"still consistently beats ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"= 1","element":"span"},{"text":". Thus, these findings demonstrate the potential benefits of using small constants ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s > ","element":"span"},{"text":"1 ","element":"span"},{"text":"in sparse JL in practice, which aligns with our theoretical results.","element":"span"}],[{"id":"id-41","style":{"fontWeight":"bold"},"text":"4.2 ","element":"span"},{"style":{"fontWeight":"bold"},"text":"Synthetic Datasets","element":"span"}],[{"text":"We used synthetic data to illustrate the phase transitions in our bounds on ","element":"span"},{"style":{"height":16},"width":192.23,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/7-18.png","element":"img","alt":" v(m, ϵ, δ, s)","inline":true,"padRight":true},{"text":"in Theorem ","element":"span"},{"href":"#id-25","text":"1.5 ","element":"a"},{"text":"for a block sparse JL distribution. 
For several choices of ","element":"span"},{"style":{"height":14.8},"width":142.02,"height":37,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/7-19.png","element":"img","alt":" s, m, ϵ, δ","inline":true},{"text":", we computed an estimate ","element":"span"},{"style":{"height":16},"width":192.23,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/7-20.png","element":"img","alt":" ˆv(m, ϵ, δ, s)","inline":true,"padRight":true},{"text":"of ","element":"span"},{"style":{"height":16},"width":192.23,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/7-21.png","element":"img","alt":" v(m, ϵ, δ, s)","inline":true,"padRight":true},{"text":"as follows. Our experiment borrowed aspects of the experimental design in ","element":"span"},{"href":"#id-18","referenceIndex":13,"text":"[13]","element":"a"},{"text":". Our synthetic data consisted of binary vectors (i.e. ","element":"span"},{"text":"vectors whose entries are in ","element":"span"},{"style":{"fontStyle":"italic"},"text":"{","element":"span"},{"text":"0","element":"span"},{"style":{"fontStyle":"italic"},"text":", ","element":"span"},{"text":"1","element":"span"},{"style":{"fontStyle":"italic"},"text":"}","element":"span"},{"text":"). 
","element":"span"},{"text":"The binary vectors were defined by a set ","element":"span"},{"style":{"fontStyle":"italic"},"text":"W ","element":"span"},{"text":"of values exponentially spread between ","element":"span"},{"text":"0","element":"span"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"03 ","element":"span"},{"text":"and ","element":"span"},{"style":{"height":13.38},"width":51.8,"height":33.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/7-22.png","element":"img","alt":" 113","inline":true},{"text":": for each ","element":"span"},{"style":{"height":11.6},"width":133.52,"height":29,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/7-23.png","element":"img","alt":" w ∈ W","inline":true},{"text":", we constructed a binary vector ","element":"span"},{"style":{"height":10.98},"width":45.78,"height":27.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/7-24.png","element":"img","alt":" xw","inline":true,"padRight":true},{"text":"where the first ","element":"span"},{"style":{"height":17.38},"width":85.45,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/7-25.png","element":"img","alt":" 1/w2","inline":true,"padRight":true},{"text":"entries are nonzero, and computed an estimate ","element":"span"},{"style":{"height":19.01},"width":203.3,"height":47.52,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/7-26.png","element":"img","alt":"ˆδ(s, m, ϵ, w)","inline":true,"padRight":true},{"text":"of the failure probability of the block sparse JL distribution on the specific vector ","element":"span"},{"style":{"height":10.98},"width":45.78,"height":27.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/7-27.png","element":"img","alt":" xw","inline":true,"padRight":true},{"text":"(i.e. 
","element":"span"},{"style":{"height":20.03},"width":668.97,"height":50.08,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/7-28.png","element":"img","alt":" PA∈As,m,1/w2 [∥Axw∥2 ̸∈ (1 ± ϵ) ∥xw∥2]","inline":true},{"text":"). We computed each ","element":"span"},{"style":{"height":19.01},"width":203.3,"height":47.52,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/7-29.png","element":"img","alt":"ˆδ(s, m, ϵ, w)","inline":true,"padRight":true},{"text":"using 100,000 samples from a block sparse JL distribution, as follows. In each sample, we independently drew a matrix ","element":"span"},{"style":{"height":17.28},"width":271.64,"height":43.2,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/7-30.png","element":"img","alt":" M ∼ As,m,1/w2","inline":true,"padRight":true},{"text":"and computed the ratio ","element":"span"},{"style":{"height":26.42},"width":120.74,"height":66.06,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/7-31.png","element":"img","alt":"∥Mxw∥2∥xw∥2","inline":true,"padRight":true},{"text":". Then, we took ","element":"span"},{"style":{"height":19.01},"width":288.58,"height":47.52,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/8-0.png","element":"img","alt":"ˆδ(s, m, ϵ, w) := (","inline":true},{"text":"number of samples where ","element":"span"},{"style":{"height":26.42},"width":332.77,"height":66.06,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/8-1.png","element":"img","alt":"∥Mxw∥2∥xw∥2 ̸∈ 1 ± ϵ)/T","inline":true},{"text":". 
Finally, we used the estimates ","element":"span"},{"style":{"height":19.01},"width":203.3,"height":47.52,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/8-2.png","element":"img","alt":"ˆδ(s, m, ϵ, w)","inline":true,"padRight":true},{"text":"to obtain the estimate ","element":"span"},{"style":{"height":29.2},"width":773.01,"height":73,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/8-3.png","element":"img","alt":" ˆv(m, ϵ, δ, s) = max{v ∈ W | ˆδ(s, m, ϵ, w) < δ","inline":true,"padRight":true},{"text":"for all ","element":"span"},{"style":{"height":11.6},"width":120.31,"height":29,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/8-4.png","element":"img","alt":" w ∈ W","inline":true,"padRight":true},{"text":"where ","element":"span"},{"style":{"height":28.8},"width":130.48,"height":72,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/8-5.png","element":"img","alt":" w ≤ v}","inline":true},{"text":".","element":"span"}],[{"id":"id-45","style":{"width":"100%"},"width":1928,"height":883,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/8-6.png","element":"img"}],[{"text":"Figure 3: Phase transitions of ","element":"figcaption","subtype":"caption"},{"style":{"height":16},"width":280.82,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/8-7.png","element":"img","alt":" ˆv(m, 0.1, 0.01, s)","inline":true}],[{"text":"Figure 4: Phase transitions of ","element":"figcaption","subtype":"caption"},{"style":{"height":16},"width":300.74,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/8-8.png","element":"img","alt":" ˆv(m, 0.05, 0.05, s)","inline":true}],[{"text":"Figure ","element":"span"},{"href":"#id-45","text":"3 ","element":"a"},{"text":"and Figure ","element":"span"},{"href":"#id-45","text":"4 ","element":"a"},{"text":"show 
","element":"span"},{"style":{"height":16},"width":192.22,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/8-9.png","element":"img","alt":" ˆv(m, ϵ, δ, s)","inline":true,"padRight":true},{"text":"as a function of dimension ","element":"span"},{"style":{"fontStyle":"italic"},"text":"m ","element":"span"},{"text":"for ","element":"span"},{"style":{"height":16},"width":279.74,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/8-10.png","element":"img","alt":" s ∈ {1, 2, 3, 4, 8}","inline":true,"padRight":true},{"text":"for two settings of ","element":"span"},{"style":{"height":0},"width":20,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/8-11.png","element":"img","alt":" ϵ","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":11.6},"width":19,"height":29,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/8-12.png","element":"img","alt":" δ","inline":true},{"text":". The error-bars are based on the distance to the next highest ","element":"span"},{"style":{"fontStyle":"italic"},"text":"v ","element":"span"},{"text":"value in ","element":"span"},{"style":{"fontStyle":"italic"},"text":"W","element":"span"},{"text":".","element":"span"}],[{"text":"Our first observation is that for each set of ","element":"span"},{"style":{"height":14.8},"width":89.3,"height":37,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/8-13.png","element":"img","alt":" s, ϵ, δ","inline":true,"padRight":true},{"text":"values considered, the curve ","element":"span"},{"style":{"height":16},"width":192.23,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/8-14.png","element":"img","alt":" ˆv(m, ϵ, δ, s)","inline":true,"padRight":true},{"text":"has “sharp” changes as a function of ","element":"span"},{"style":{"fontStyle":"italic"},"text":"m","element":"span"},{"text":". 
More specifically, ","element":"span"},{"style":{"height":16},"width":192.23,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/8-15.png","element":"img","alt":" ˆv(m, ϵ, δ, s)","inline":true,"padRight":true},{"text":"is ","element":"span"},{"text":"0 ","element":"span"},{"text":"at small ","element":"span"},{"style":{"fontStyle":"italic"},"text":"m","element":"span"},{"text":", then there is a phase transition to a nonzero value, then an increase to a higher value, then an interval where the value appears “flat”, and lastly a second phase transition to ","element":"span"},{"text":"1","element":"span"},{"text":". The first phase transition is shared between ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"values, but the second phase transition occurs at different dimensions ","element":"span"},{"style":{"fontStyle":"italic"},"text":"m ","element":"span"},{"text":"(but is within a factor of ","element":"span"},{"text":"3 ","element":"span"},{"text":"between ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"values). Here, the first phase transition likely corresponds to ","element":"span"},{"style":{"height":17.39},"width":251.37,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/8-16.png","element":"img","alt":" Θ(ϵ−2 ln(1/δ))","inline":true,"padRight":true},{"text":"and the second phase transition likely corresponds to ","element":"span"},{"style":{"height":28.8},"width":812.6,"height":72,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/8-17.png","element":"img","alt":" min(ϵ−2eΘ(ln(1/δ)), ϵ−2 ln(1/δ)eΘ(ln(1/δ)ϵ−1/s))","inline":true},{"text":".","element":"span"}],[{"text":"Our second observation is that as ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"increases, the “flat” part occurs at a higher y-coordinate. 
Here, the increase in the “flat” y-coordinate as a function of ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"corresponds to the ","element":"span"},{"style":{"height":16},"width":52.2,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/8-18.png","element":"img","alt":"√s","inline":true,"padRight":true},{"text":"term in ","element":"span"},{"style":{"height":16},"width":192.23,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/8-19.png","element":"img","alt":" v(m, ϵ, δ, s)","inline":true},{"text":". Technically, according to Theorem ","element":"span"},{"href":"#id-25","text":"1.5, ","element":"a"},{"text":"the “flat” parts should be increasing in ","element":"span"},{"style":{"fontStyle":"italic"},"text":"m ","element":"span"},{"text":"at a slow rate: the empirical “flatness” likely arises since ","element":"span"},{"style":{"fontStyle":"italic"},"text":"W ","element":"span"},{"text":"is a finite set in the experiments.","element":"span"}],[{"text":"Our third observation is that ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s > ","element":"span"},{"text":"1 ","element":"span"},{"text":"generally outperforms ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"= 1 ","element":"span"},{"text":"as Theorem ","element":"span"},{"href":"#id-25","text":"1.5 ","element":"a"},{"text":"suggests: that is, ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s > ","element":"span"},{"text":"1 ","element":"span"},{"text":"generally attains a higher ","element":"span"},{"style":{"height":16},"width":192.23,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/8-20.png","element":"img","alt":" ˆv(m, ϵ, δ, s)","inline":true,"padRight":true},{"text":"value than ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"= 1","element":"span"},{"text":". 
We note at large ","element":"span"},{"style":{"fontStyle":"italic"},"text":"m ","element":"span"},{"text":"values (where ","element":"span"},{"style":{"height":16},"width":192.23,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/8-21.png","element":"img","alt":" ˆv(m, ϵ, δ, s)","inline":true,"padRight":true},{"text":"is close to ","element":"span"},{"text":"1","element":"span"},{"text":"), lower ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"settings sometimes attain a higher ","element":"span"},{"style":{"height":16},"width":192.23,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/8-22.png","element":"img","alt":" ˆv(m, ϵ, δ, s)","inline":true,"padRight":true},{"text":"than higher ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"settings (e.g. the second phase transition doesn’t quite occur in decreasing order of ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"in Figure ","element":"span"},{"href":"#id-45","text":"3)","element":"a"},{"text":": see Appendix ","element":"span"},{"text":"I ","element":"span"},{"text":"for a discussion of this non-monotonicity in ","element":"span"},{"style":{"height":13.39},"width":61.62,"height":33.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/8-23.png","element":"img","alt":" s.15","inline":true,"padRight":true},{"text":"Nonetheless, in practice, it’s unlikely to select such a large dimension ","element":"span"},{"style":{"fontStyle":"italic"},"text":"m","element":"span"},{"text":", since the 
","element":"span"},{"style":{"height":5.2},"width":48.61,"height":13,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/8-24.png","element":"img","alt":"ℓ∞","inline":true},{"text":"-to-","element":"span"},{"style":{"height":7.6},"width":32.6,"height":19,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/8-25.png","element":"img","alt":"ℓ2","inline":true,"padRight":true},{"text":"guarantees of smaller ","element":"span"},{"style":{"fontStyle":"italic"},"text":"m ","element":"span"},{"text":"are likely sufficient. Hence, a greater sparsity generally leads to a better ","element":"span"},{"style":{"height":16},"width":192.23,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/8-26.png","element":"img","alt":"ˆv(m, ϵ, δ, s)","inline":true,"padRight":true},{"text":"value, thus aligning with our theoretical findings.","element":"span"}]]},{"heading":"References","paragraphs":[[{"id":"id-42","text":"[1] The 20 newsgroups text dataset. ","element":"span"},{"href":"https://scikit-learn.org/0.19/datasets/twenty_newsgroups.html","style":{"fontFamily":"monospace"},"text":"https://scikit-learn.org/0.19/datasets/twenty_newsgroups. ","element":"a"},{"href":"https://scikit-learn.org/0.19/datasets/twenty_newsgroups.html","style":{"fontFamily":"monospace"},"text":"html","element":"a"},{"text":".","element":"span"}],[{"id":"id-12","text":"[2] D. Achlioptas. Database-friendly random projections: Johnson-lindenstrauss with binary coins. ","element":"span"},{"style":{"fontStyle":"italic"},"text":"J. Comput. Syst. Sci.","element":"span"},{"text":", 66(4):671–687, June 2003.","element":"span"}],[{"id":"id-28","text":"[3] Z. Allen-Zhu, R. Gelashvili, S. Micali, and N. Shavit. ","element":"span"},{"text":"Sparse sign-consistent Johnson–Lindenstrauss matrices: Compression with neuroscience-based constraints. 
In ","element":"span"},{"style":{"fontStyle":"italic"},"text":"Proceedings of the National Academy of Sciences (PNAS)","element":"span"},{"text":", volume 111, pages 16872–16876, 2014.","element":"span"}],[{"id":"id-3","text":"[4] Bing Bai, Jason Weston, David Grangier, Ronan Collobert, Kunihiko Sadamasa, Yanjun Qi, Olivier ","element":"span"},{"text":"Chapelle, and Kilian Weinberger. Learning to rank with (a lot of) word features. ","element":"span"},{"style":{"fontStyle":"italic"},"text":"Information Retrieval","element":"span"},{"text":", 13(3):291–314, Jun 2010.","element":"span"}],[{"id":"id-5","text":"[5] C. Caragea, A. Silvescu, and P. Mitra. Protein sequence classification using feature hashing. ","element":"span"},{"style":{"fontStyle":"italic"},"text":"Proteome Science","element":"span"},{"text":", 10(1), 2012.","element":"span"}],[{"id":"id-24","text":"[6] C. Chen, C. Vong, C. Wong, W. Wang, and P. Wong. Efficient extreme learning machine via very sparse ","element":"span"},{"text":"random projection. ","element":"span"},{"style":{"fontStyle":"italic"},"text":"Soft Computing","element":"span"},{"text":", 22, 03 2018.","element":"span"}],[{"id":"id-4","text":"[7] W. Chen, J. Wilson, S. Tyree, K. Q. Weinberger, and Y. Chen. Compressing neural networks with the ","element":"span"},{"text":"hashing trick. ","element":"span"},{"style":{"fontStyle":"italic"},"text":"Proceedings of the 32nd Annual International Conference on Machine Learning (ICML)","element":"span"},{"text":", pages 2285–2294, 2015.","element":"span"}],[{"id":"id-15","text":"[8] M. B. Cohen. Nearly tight oblivious subspace embeddings by trace inequalities. In ","element":"span"},{"style":{"fontStyle":"italic"},"text":"Proceedings of the Twenty-Seventh Annual ACM-SIAM Symposium on Discrete Algorithms (SODA)","element":"span"},{"text":", pages 278–287, 2016.","element":"span"}],[{"id":"id-30","text":"[9] M. B. Cohen, T. S. Jayram, and J. Nelson. 
Simple analyses of the sparse Johnson-Lindenstrauss transform. ","element":"span"},{"text":"In ","element":"span"},{"style":{"fontStyle":"italic"},"text":"Proceedings of the 1st Symposium on Simplicity in Algorithms (SOSA)","element":"span"},{"text":", pages 1–9, 2018.","element":"span"}],[{"id":"id-20","text":"[10] S. Dahlgaard, M. Knudsen, and M. Thorup. Practical hash functions for similarity estimation and dimen- ","element":"span"},{"text":"sionality reduction. In ","element":"span"},{"style":{"fontStyle":"italic"},"text":"Proceedings of the 31st International Conference on Neural Information Processing Systems (NIPS)","element":"span"},{"text":", pages 6618–6628, 2017.","element":"span"}],[{"id":"id-0","text":"[11] B. Dalessandro. ","element":"span"},{"text":"Bring the noise: Embracing randomness is the key to scaling up machine learning algorithms. ","element":"span"},{"style":{"fontStyle":"italic"},"text":"Big Data","element":"span"},{"text":", 1(2):110–112, 2013.","element":"span"}],[{"id":"id-14","text":"[12] A. Dasgupta, R. Kumar, and T. Sarlos. A sparse Johnson-Lindenstrauss transform. In ","element":"span"},{"style":{"fontStyle":"italic"},"text":"Proceedings of the 42nd ACM Symposium on Theory of Computing (STOC)","element":"span"},{"text":", pages 341–350, 2010.","element":"span"}],[{"id":"id-18","text":"[13] C. Freksen, L. Kamma, and K. G. Larsen. Fully understanding the hashing trick. In ","element":"span"},{"style":{"fontStyle":"italic"},"text":"Proceedings of the 32nd International Conference on Neural Information Processing Systems (NeurIPS)","element":"span"},{"text":", pages 5394–5404, 2018.","element":"span"}],[{"id":"id-31","text":"[14] M. Jagadeesan. Simple analysis of sparse, sign-consistent JL. 
In ","element":"span"},{"style":{"fontStyle":"italic"},"text":"Proceedings of the 23rd International Conference and 24th International Conference on Approximation, Randomization, and Combinatorial Optimization: Algorithms and Techniques (RANDOM)","element":"span"},{"text":", pages 61:1–61:20, 2019.","element":"span"}],[{"id":"id-9","text":"[15] T.S. Jayram and D. P. Woodruff. ","element":"span"},{"text":"Optimal bounds for Johnson-Lindenstrauss transforms and streaming problems with subconstant error. In ","element":"span"},{"style":{"fontStyle":"italic"},"text":"ACM Transactions on Algorithms (TALG) - Special Issue on ","element":"span"},{"style":{"height":12},"width":164.22,"height":30,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/9-0.png","element":"img","alt":"SODA’11","inline":true},{"text":", volume 9, pages 1–26, 2013.","element":"span"}],[{"id":"id-7","text":"[16] W. B. Johnson and J. Lindenstrauss. Extensions of Lipschitz mappings into a Hilbert space. ","element":"span"},{"style":{"fontStyle":"italic"},"text":"Contemporary Mathematics","element":"span"},{"text":", 26:189–206, 1984.","element":"span"}],[{"id":"id-8","text":"[17] D. M. Kane, R. Meka, and J. Nelson. Almost optimal explicit Johnson-Lindenstrauss families. In ","element":"span"},{"style":{"fontStyle":"italic"},"text":"Proceedings of the 14th International Workshop and 15th International Conference on Approximation, Randomization, and Combinatorial Optimization: Algorithms and Techniques (RANDOM)","element":"span"},{"text":", pages 628–639, 2011.","element":"span"}],[{"id":"id-19","text":"[18] D. M. Kane and J. Nelson. ","element":"span"},{"text":"A derandomized sparse Johnson-Lindenstrauss transform. ","element":"span"},{"style":{"fontStyle":"italic"},"text":"CoRR","element":"span"},{"text":", abs/1006.3585, 2010.","element":"span"}],[{"id":"id-10","text":"[19] D. M. Kane and J. Nelson. Sparser Johnson-Lindenstrauss transforms. 
In ","element":"span"},{"style":{"fontStyle":"italic"},"text":"Proceedings of the 23rd Annual ACM-SIAM Symposium on Discrete Algorithms (SODA)","element":"span"},{"text":", pages 16872–16876. ACM Press, 2012.","element":"span"}],[{"id":"id-33","text":"[20] R. Latała. Estimation of moments of sums of independent real random variables. ","element":"span"},{"style":{"fontStyle":"italic"},"text":"Annals of Probability","element":"span"},{"text":", 25(3):1502–1513, 1997.","element":"span"}],[{"id":"id-32","text":"[21] R. Latała. Tail and moment estimates for some types of chaos. ","element":"span"},{"style":{"fontStyle":"italic"},"text":"Studia Mathematica","element":"span"},{"text":", 135(1):39–53, 1999.","element":"span"}],[{"id":"id-13","text":"[22] P. Li, T. Hastie, and K. Church. ","element":"span"},{"text":"Very sparse random projections. ","element":"span"},{"text":"In ","element":"span"},{"style":{"fontStyle":"italic"},"text":"Proceedings of the 12th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining","element":"span"},{"text":", KDD ’06, pages 287–296, 2006.","element":"span"}],[{"id":"id-23","text":"[23] C. Ma, J. Jung, S. Kim, and S. Ko. Random projection-based partial feature extraction for robust face ","element":"span"},{"text":"recognition. ","element":"span"},{"style":{"fontStyle":"italic"},"text":"Neurocomputing","element":"span"},{"text":", 149:1232 – 1244, 2015.","element":"span"}],[{"id":"id-29","text":"[24] J. Nelson and H.L. Nguyen. OSNAP: Faster numerical linear algebra algorithms via sparser subspace ","element":"span"},{"text":"embeddings. In ","element":"span"},{"style":{"fontStyle":"italic"},"text":"Foundations of Computer Science (FOCS), 2013 IEEE 54th Annual Symposium on","element":"span"},{"text":", pages 117–126, 2013.","element":"span"}],[{"text":"[25] J. Nelson and H.L. Nguyen. Sparsity lower bounds for dimensionality reducing maps. 
In ","element":"span"},{"style":{"fontStyle":"italic"},"text":"Proceedings of the 45th Annual ACM Symposium on Theory of Computing (STOC)","element":"span"},{"text":", pages 101–110, 2013.","element":"span"}],[{"id":"id-43","text":"[26] D. Newman. Bag of words data set. ","element":"span"},{"href":"https://archive.ics.uci.edu/ml/datasets/Bag+of+Words","style":{"fontFamily":"monospace"},"text":"https://archive.ics.uci.edu/ml/datasets/Bag+of+Words","element":"a"},{"text":", 2008.","element":"span"}],[{"id":"id-22","text":"[27] H. Song. Robust visual tracking via online informative feature selection. ","element":"span"},{"style":{"fontStyle":"italic"},"text":"Electronics Letters","element":"span"},{"text":", 50(25):1931– 1932, 2014.","element":"span"}],[{"id":"id-2","text":"[28] S. Suthaharan. ","element":"span"},{"style":{"fontStyle":"italic"},"text":"Machine Learning Models and Algorithms for Big Data Classification: Thinking with Examples for Effective Learning","element":"span"},{"text":", volume 36 of ","element":"span"},{"style":{"fontStyle":"italic"},"text":"Integrated Series in Information Systems","element":"span"},{"text":". Springer US, Boston, MA, 2016.","element":"span"}],[{"id":"id-1","text":"[29] K. Weinberger, A. Dasgupta, J. Langford, A. Smola, and J. Attenberg. Feature hashing for large scale ","element":"span"},{"text":"multitask learning. In ","element":"span"},{"style":{"fontStyle":"italic"},"text":"Proceedings of the 26th Annual International Conference on Machine Learning (ICML)","element":"span"},{"text":", pages 1113–1120, 2009.","element":"span"}]]},{"heading":"APPENDIX","paragraphs":[[{"text":"In Appendix ","element":"span"},{"text":"A, ","element":"span"},{"text":"we prove our corollary regarding dimension-sparsity tradeoffs and discuss some of the subtleties of Theorem ","element":"span"},{"href":"#id-25","text":"1.5. 
","element":"a"},{"text":"In Appendix ","element":"span"},{"text":"B, ","element":"span"},{"text":"we show that the Hanson-Wright bound is too loose to prove Theorem ","element":"span"},{"href":"#id-25","text":"1.5. ","element":"a"},{"text":"In Appendix ","element":"span"},{"text":"C, ","element":"span"},{"text":"we state and prove useful moment bounds that we use throughout the analysis. In Appendix ","element":"span"},{"text":"D, ","element":"span"},{"text":"we prove our moment bounds for ","element":"span"},{"style":{"height":16},"width":250.02,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-0.png","element":"img","alt":" Zr(x1, . . . , xn)","inline":true,"padRight":true},{"text":"in Lemma ","element":"span"},{"href":"#id-34","text":"2.1 ","element":"a"},{"text":"and Lemma ","element":"span"},{"href":"#id-35","text":"2.2. ","element":"a"},{"text":"In Appendix ","element":"span"},{"text":"E, ","element":"span"},{"text":"we prove our moment bounds for ","element":"span"},{"style":{"height":16},"width":235.74,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-1.png","element":"img","alt":" R(x1, . . . , xn)","inline":true,"padRight":true},{"text":"in Lemma ","element":"span"},{"href":"#id-36","text":"2.3 ","element":"a"},{"text":"and Lemma ","element":"span"},{"href":"#id-37","text":"2.4. ","element":"a"},{"text":"In Appendix ","element":"span"},{"text":"F, ","element":"span"},{"text":"we prove auxiliary lemmas needed in the proof of Lemma ","element":"span"},{"href":"#id-36","text":"2.3. ","element":"a"},{"text":"In Appendix ","element":"span"},{"text":"G, ","element":"span"},{"text":"we prove auxiliary lemmas needed in the proof of Lemma ","element":"span"},{"href":"#id-37","text":"2.4. 
","element":"a"},{"text":"In Appendix ","element":"span"},{"text":"H, ","element":"span"},{"text":"we prove our simplified moment bounds for ","element":"span"},{"style":{"height":16},"width":235.74,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-2.png","element":"img","alt":" R(x1, . . . , xn)","inline":true,"padRight":true},{"text":"in Lemma ","element":"span"},{"href":"#id-38","text":"3.1 ","element":"a"},{"text":"and Lemma ","element":"span"},{"href":"#id-39","text":"3.2. ","element":"a"},{"text":"In Appendix ","element":"span"},{"text":"I, ","element":"span"},{"text":"we provide additional experimental results on real-world and synthetic datasets as well as additional discussion.","element":"span"}]]},{"heading":"A Discussion of Theoretical Results","paragraphs":[[{"text":"We discuss some of the subtleties of Theorem ","element":"span"},{"href":"#id-25","text":"1.5. ","element":"a"},{"text":"When ","element":"span"},{"style":{"height":20.2},"width":697.48,"height":50.49,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-3.png","element":"img","alt":" m ≥ min(2ϵ−2ep, ϵ−2peΘ(max(1,pϵ−1/s)))","inline":true},{"text":", where ","element":"span"},{"style":{"height":16},"width":210.52,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-4.png","element":"img","alt":"p = ln(1/δ)","inline":true},{"text":", we show that ","element":"span"},{"style":{"height":16},"width":278.44,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-5.png","element":"img","alt":" v(m, ϵ, δ, s) = 1","inline":true},{"text":", which means that the norm-preserving condition holds on the full space. This generalizes Cohen’s bound ","element":"span"},{"href":"#id-15","referenceIndex":8,"text":"[8] ","element":"a"},{"text":"to a slightly more general family of sparse JL distributions, as we discuss below. 
When ","element":"span"},{"style":{"height":17.39},"width":347.58,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-6.png","element":"img","alt":" m ≤ Θ(ϵ−2 ln(1/δ))","inline":true},{"text":", we show that ","element":"span"},{"style":{"height":16},"width":272.94,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-7.png","element":"img","alt":" v(m, ϵ, δ, s) = 0","inline":true},{"text":". For the remaining regimes, ","element":"span"},{"style":{"height":28.8},"width":313.94,"height":72,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-8.png","element":"img","alt":"√ϵs�ln( mϵ2p )/√p","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":29},"width":612.5,"height":72.5,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-9.png","element":"img","alt":" √ϵs min�ln( mϵp )/p,�ln( mϵ2p )/√p�","inline":true},{"text":", our upper and lower bounds on ","element":"span"},{"style":{"height":16},"width":192.23,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-10.png","element":"img","alt":" v(m, ϵ, δ, s)","inline":true,"padRight":true},{"text":"match up to constant factors.","element":"span"}],[{"text":"In terms of the boundaries between regimes, we emphasize that in Theorem ","element":"span"},{"href":"#id-25","text":"1.5, ","element":"a"},{"text":"the function ","element":"span"},{"style":{"height":16},"width":206.46,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-11.png","element":"img","alt":" f ′(m, ϵ, δ, s)","inline":true,"padRight":true},{"text":"may not be defined for certain intervals between the boundaries of regimes, since there may be different absolute constants in different boundaries. 
","element":"span"},{"text":"More specifically, these intervals are ","element":"span"},{"style":{"height":16.59},"width":433.68,"height":41.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-12.png","element":"img","alt":" C1ϵ−2p ≤ m ≤ C2ϵ−2p","inline":true},{"text":", ","element":"span"},{"style":{"height":15.79},"width":418.67,"height":39.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-13.png","element":"img","alt":"ϵ−2eC1p ≤ m ≤ 2ϵ−2ep","inline":true},{"text":", and ","element":"span"},{"style":{"height":18.6},"width":817.17,"height":46.49,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-14.png","element":"img","alt":" s · eC1 max(1,pϵ−1/s) ≤ m ≤ s · eC2 max(1,pϵ−1/s)","inline":true},{"text":". These gaps arise because the boundaries between the regimes on our upper and lower bounds on ","element":"span"},{"style":{"height":16},"width":192.23,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-15.png","element":"img","alt":" v(m, ϵ, δ, s)","inline":true,"padRight":true},{"text":"can have different absolute constants, so we don’t have precise control on ","element":"span"},{"style":{"height":16},"width":192.23,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-16.png","element":"img","alt":" v(m, ϵ, δ, s)","inline":true,"padRight":true},{"text":"in these gaps. 
Nonetheless, the gaps only span a constant factor range on the exponent in the dimension ","element":"span"},{"style":{"fontStyle":"italic"},"text":"m","element":"span"},{"text":".","element":"span"}],[{"text":"We now state the dimension-sparsity tradeoffs that follow from our bounds:","element":"span"}],[{"id":"id-26","style":{"fontWeight":"bold"},"text":"Corollary A.1 ","element":"span"},{"text":"Suppose that ","element":"span"},{"style":{"height":0},"width":20,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-17.png","element":"img","alt":" ϵ","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":11.6},"width":19,"height":29,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-18.png","element":"img","alt":" δ","inline":true,"padRight":true},{"text":"are sufficiently small and ","element":"span"},{"style":{"height":16},"width":145.72,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-19.png","element":"img","alt":" s ≤ m/e","inline":true},{"text":". If ","element":"span"},{"style":{"height":16.39},"width":114.05,"height":40.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-20.png","element":"img","alt":" As,m,n","inline":true,"padRight":true},{"text":"is any sparse JL distribution, then ","element":"span"},{"style":{"height":16},"width":268.83,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-21.png","element":"img","alt":" v(m, ϵ, δ, s) = 1","inline":true,"padRight":true},{"text":"when ","element":"span"},{"style":{"height":28.8},"width":895.37,"height":72,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-22.png","element":"img","alt":" m ≥ min�2ϵ−2/δ, ϵ−2 ln(1/δ)eΘ(max(1,ln(1/δ)ϵ−1/s))�","inline":true},{"text":". 
If ","element":"span"},{"style":{"height":16.39},"width":114.05,"height":40.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-23.png","element":"img","alt":" A_{s,m,n}","inline":true,"padRight":true},{"text":"is a uniform sparse","element":"span"}],[{"text":"JL distribution, then ","element":"span"},{"style":{"height":16},"width":304.71,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-24.png","element":"img","alt":" v(m, \\epsilon, \\delta, s) \\le 1/2","inline":true,"padRight":true},{"text":"when ","element":"span"},{"style":{"height":28.8},"width":1003.7,"height":72,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-25.png","element":"img","alt":" m \\le \\min\\bigl(\\epsilon^{-2} e^{\\Theta(\\ln(1/\\delta))},\\ \\epsilon^{-2} \\ln(1/\\delta)\\, e^{\\Theta(\\max(1,\\, \\ln(1/\\delta)\\epsilon^{-1}/s))}\\bigr)","inline":true},{"text":", apart from a constant-factor interval ","element":"span"},{"style":{"height":17.39},"width":640.22,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-26.png","element":"img","alt":" C_1 \\epsilon^{-2} \\ln(1/\\delta) \\le m \\le C_2 \\epsilon^{-2} \\ln(1/\\delta)","inline":true,"padRight":true},{"text":"where we do not have a bound on the behavior of sparse JL.","element":"span"}],[{"style":{"fontStyle":"italic"},"text":"Proof of Corollary ","element":"span"},{"href":"#id-26","style":{"fontStyle":"italic"},"text":"A.","element":"a"},{"text":"1","element":"span"},{"style":{"fontStyle":"italic"},"text":". ","element":"span"},{"text":"The first statement follows from the fact that the lower bound in Theorem ","element":"span"},{"href":"#id-25","text":"1.5 ","element":"a"},{"text":"holds for any sparse JL distribution. For the upper bound, we also use Theorem ","element":"span"},{"href":"#id-25","text":"1.5. 
","element":"a"},{"text":"Let’s set ","element":"span"},{"style":{"height":30.37},"width":328.35,"height":75.94,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-27.png","element":"img","alt":" C_v \\sqrt{\\epsilon s}\\, \\sqrt{\\ln(m\\epsilon^{2}/p)} / \\sqrt{p} = 1/2","inline":true},{"text":", where ","element":"span"},{"style":{"height":13.19},"width":44.48,"height":32.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-28.png","element":"img","alt":" C_v","inline":true}],[{"text":"is the implicit constant in the upper bound. This solves to ","element":"span"},{"style":{"height":16.59},"width":186.13,"height":41.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-29.png","element":"img","alt":" m = \\epsilon^{-2} p\\, e^{\\Theta(p \\epsilon^{-1}/s)}","inline":true}],[{"text":"We also have the condition that ","element":"span"},{"style":{"height":16.58},"width":324.76,"height":41.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-30.png","element":"img","alt":" m \\le \\epsilon^{-2} e^{\\Theta(\\ln(1/\\delta))}","inline":true,"padRight":true},{"text":"for this regime to be reached. We can obtain the ","element":"span"},{"text":"max ","element":"span"},{"text":"with ","element":"span"},{"text":"1 ","element":"span"},{"text":"on the exponent, by using that ","element":"span"},{"style":{"height":16},"width":264.89,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-31.png","element":"img","alt":" v(m, \\epsilon, \\delta, s) = 0","inline":true,"padRight":true},{"text":"when ","element":"span"},{"style":{"height":17.38},"width":339.5,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-32.png","element":"img","alt":" m \\le \\Theta(\\epsilon^{-2} \\ln(1/\\delta))","inline":true},{"text":". 
To avoid having a gap when ","element":"span"},{"style":{"height":16.2},"width":486.26,"height":40.49,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-33.png","element":"img","alt":"m = s·eΘ(max(1,ln(1/δ)ϵ−1/s))","inline":true},{"text":", we implicitly use that our lower bound actually doesn’t have a gap between these regimes (though there may be a gap in the boundary between the lower bound and upper bound). Thus, we only have to keep the gap ","element":"span"},{"style":{"height":17.38},"width":612.23,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-34.png","element":"img","alt":" C1ϵ−2 ln(1/δ) ≤ m ≤ C2ϵ−2 ln(1/δ)","inline":true,"padRight":true},{"text":"where we do not have a lower bound.","element":"span"}],[{"text":"Notice that the upper and lower bounds in Corollary ","element":"span"},{"href":"#id-26","style":{"fontStyle":"italic"},"text":"A.","element":"a"},{"text":"1 ","element":"span"},{"text":"also match up to constant factors on the exponent in the dimension ","element":"span"},{"style":{"fontStyle":"italic"},"text":"m","element":"span"},{"text":".","element":"span"}]]},{"heading":"B Hanson-Wright is too loose even for s = 1","paragraphs":[[{"text":"Though Cohen, Jayram, and Nelson ","element":"span"},{"href":"#id-30","referenceIndex":9,"text":"[9] ","element":"a"},{"text":"also view ","element":"span"},{"style":{"height":16},"width":235.74,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-35.png","element":"img","alt":" R(x1, . . . , xn)","inline":true,"padRight":true},{"text":"as a quadratic form, we show that their approach is not sufficiently precise for our setting. They upper bound the moments of ","element":"span"},{"style":{"height":16},"width":235.74,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/11-36.png","element":"img","alt":" R(x1, . . . 
, xn)","inline":true,"padRight":true},{"text":"by the","element":"span"}],[{"text":"gaussian case through considering:","element":"span"}],[{"style":{"width":"39%"},"width":755,"height":117,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/12-0.png","element":"img"}],[{"text":"where the ","element":"span"},{"style":{"height":11.59},"width":53.38,"height":28.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/12-1.png","element":"img","alt":" gr,i","inline":true,"padRight":true},{"text":"are i.i.d standard gaussians. They use the fact Rademachers are subgaussian to conclude that ","element":"span"},{"style":{"height":32.69},"width":654.54,"height":81.72,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/12-2.png","element":"img","alt":"∥R(x1, . . . , xn)∥q ≤�� ˜R(x1, . . . , xn)��q","inline":true},{"text":". In order to obtain upper bounds on","element":"span"},{"style":{"height":32.69},"width":294.52,"height":81.72,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/12-3.png","element":"img","alt":"�� ˜R(x1, . . . , xn)��q","inline":true},{"text":", they use the ","element":"span"},{"text":"Hanson-Wright bound, a tight bound on moments of gaussian quadratic forms. However, we need different technical tools for two reasons.","element":"span"}],[{"text":"1. First, in order to upper bound ","element":"span"},{"style":{"height":16},"width":192.23,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/12-4.png","element":"img","alt":" v(m, ϵ, δ, s)","inline":true},{"text":", we need to ","element":"span"},{"style":{"height":19.18},"width":527.78,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/12-5.png","element":"img","alt":" lower bound ∥|R(x1, . . . 
, xn)∥q","inline":true},{"text":", and thus cannot simply consider","element":"span"},{"style":{"height":32.69},"width":294.52,"height":81.72,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/12-6.png","element":"img","alt":"∥˜R(x1, . . . , xn)∥q","inline":true},{"text":".","element":"span"}],[{"text":"2. Second, even to lower bound ","element":"span"},{"style":{"height":16},"width":192.23,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/12-7.png","element":"img","alt":" v(m, ϵ, δ, s)","inline":true},{"text":", using","element":"span"},{"style":{"height":32.69},"width":294.52,"height":81.72,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/12-8.png","element":"img","alt":"∥˜R(x1, . . . , xn)∥q","inline":true,"padRight":true},{"text":"as an upper bound for ","element":"span"},{"style":{"height":19.18},"width":290.09,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/12-9.png","element":"img","alt":" ∥R(x1, . . . , xn)∥q","inline":true,"padRight":true},{"text":"is not sufficiently strong. Below, we give a counter-example, i.e. a vector ","element":"span"},{"style":{"fontStyle":"italic"},"text":"x","element":"span"},{"text":", where","element":"span"},{"style":{"height":32.69},"width":294.52,"height":81.72,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/12-10.png","element":"img","alt":"∥˜R(x1, . . . , xn)∥q","inline":true,"padRight":true},{"text":"is ","element":"span"},{"text":"too large to recover a tight lower bound.","element":"span"}],[{"text":"Thus, we cannot use the Hanson-Wright bound in this setting, and need to come up with a better bound on ","element":"span"},{"style":{"height":19.18},"width":290.09,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/12-11.png","element":"img","alt":"∥R(x1, . . . 
, xn)∥q","inline":true,"padRight":true},{"text":"that does not implicitly replace Rademachers by gaussians. The second point is similar in flavor to the conceptual point made in ","element":"span"},{"href":"#id-31","referenceIndex":14,"text":"[14]","element":"a"},{"text":", where a sign-consistent variant of sparse JL was analyzed using an ","element":"span"},{"style":{"fontStyle":"italic"},"text":"upper ","element":"span"},{"text":"bound for Rademacher quadratic forms. However, the bound in ","element":"span"},{"href":"#id-31","referenceIndex":14,"text":"[14] ","element":"a"},{"text":"also turns out to be loose in this setting and also can’t be used to obtain either a sufficiently tight upper bound or a lower bound for ","element":"span"},{"style":{"height":16},"width":235.74,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/12-12.png","element":"img","alt":"R(x1, . . . , xn)","inline":true},{"text":".","element":"span"}],[{"text":"We now show point (2): that the Hanson-Wright bound is not sufficiently strong to obtain a lower bound ","element":"span"},{"style":{"height":16},"width":192.23,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/12-13.png","element":"img","alt":"v(m, ϵ, δ, s)","inline":true},{"text":". We consider ","element":"span"},{"style":{"height":22.01},"width":842.01,"height":55.03,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/12-14.png","element":"img","alt":"˜R(x1, . . . , xn) = 1s�mr=1�i̸=j ηr,iηr,jgr,igr,jxixj","inline":true},{"text":", as above, where the ","element":"span"},{"style":{"height":11.59},"width":53.39,"height":28.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/12-15.png","element":"img","alt":" gr,i","inline":true,"padRight":true},{"text":"are i.i.d ","element":"span"},{"text":"standard gaussians. 
We consider ","element":"span"},{"style":{"fontStyle":"italic"},"text":"p ","element":"span"},{"text":"equal to ","element":"span"},{"style":{"height":16},"width":123.78,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/12-16.png","element":"img","alt":" ln(1/δ)","inline":true,"padRight":true},{"text":"rounded up to the nearest even integer, and we consider a vector of the form ","element":"span"},{"text":"[","element":"span"},{"style":{"fontStyle":"italic"},"text":"v, . . . , v, ","element":"span"},{"text":"0","element":"span"},{"style":{"fontStyle":"italic"},"text":", . . . , ","element":"span"},{"text":"0] ","element":"span"},{"text":"where ","element":"span"},{"style":{"height":19.37},"width":30.95,"height":48.43,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/12-17.png","element":"img","alt":"1v2","inline":true,"padRight":true},{"text":"is an integer and ","element":"span"},{"style":{"height":13.2},"width":93.88,"height":33,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/12-18.png","element":"img","alt":" v ≥ 0","inline":true},{"text":". We show","element":"span"},{"style":{"height":32.69},"width":527.47,"height":81.72,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/12-19.png","element":"img","alt":"�� ˜R(v, . . . , v, 0, . . . , 0)��p ≳ ω(ϵ)","inline":true,"padRight":true},{"text":"for a certain ","element":"span"},{"style":{"fontStyle":"italic"},"text":"v ","element":"span"},{"text":"value, where we know it to be true that ","element":"span"},{"style":{"height":19.18},"width":469.13,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/12-20.png","element":"img","alt":" ∥R(v, . . . , v, 0, . . . , 0)∥p ≲ ϵ","inline":true},{"text":".","element":"span"}],[{"text":"Let’s consider a vector ","element":"span"},{"text":"[","element":"span"},{"style":{"fontStyle":"italic"},"text":"v, . . . 
, v, ","element":"span"},{"text":"0","element":"span"},{"style":{"fontStyle":"italic"},"text":", . . . , ","element":"span"},{"text":"0] ","element":"span"},{"text":"where ","element":"span"},{"style":{"height":19.37},"width":30.94,"height":48.43,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/12-21.png","element":"img","alt":"1v2","inline":true,"padRight":true},{"text":"is an integer and ","element":"span"},{"style":{"height":13.2},"width":98.2,"height":33,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/12-22.png","element":"img","alt":" v ≥ 0","inline":true},{"text":". We apply the Hanson-Wright ","element":"span"},{"text":"bound (which is tight for gaussians) to obtain:","element":"span"}],[{"style":{"width":"63%"},"width":1213,"height":320,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/12-23.png","element":"img"}],[{"text":"Let ","element":"span"},{"style":{"height":20.4},"width":255.53,"height":51.01,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/12-24.png","element":"img","alt":" M = �Ni=1 η1,i","inline":true},{"text":". Let ","element":"span"},{"style":{"height":16},"width":139.24,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/12-25.png","element":"img","alt":" S ⊆ [N]","inline":true,"padRight":true},{"text":"be the set of indices where ","element":"span"},{"style":{"height":15.59},"width":132.47,"height":38.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/12-26.png","element":"img","alt":" η1,i = 1","inline":true},{"text":". 
We can set the vector to ","element":"span"},{"style":{"height":22.73},"width":239.96,"height":56.83,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/12-27.png","element":"img","alt":" xi = yi = 1√M","inline":true,"padRight":true},{"text":"for all ","element":"span"},{"style":{"height":11.6},"width":88.43,"height":29,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/12-28.png","element":"img","alt":" i ∈ S","inline":true,"padRight":true},{"text":"and ","element":"span"},{"text":"0 ","element":"span"},{"text":"elsewhere. This gives us:","element":"span"}],[{"style":{"width":"82%"},"width":1578,"height":153,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/12-29.png","element":"img"}],[{"text":"We can expand out this moment to obtain:","element":"span"}],[{"style":{"width":"71%"},"width":1361,"height":394,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/12-30.png","element":"img"}],[{"text":"Since ","element":"span"},{"style":{"height":14},"width":137.32,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-0.png","element":"img","alt":" M ≤ p","inline":true},{"text":", we know that","element":"span"},{"style":{"height":22.7},"width":207.16,"height":56.76,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-1.png","element":"img","alt":"� pM�M ≥ 1","inline":true},{"text":". 
","element":"span"},{"text":"Moreover, as long as ","element":"span"},{"style":{"height":16.57},"width":156.36,"height":41.43,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-2.png","element":"img","alt":" p ≥ semv2","inline":true,"padRight":true},{"text":", we know that","element":"span"},{"style":{"height":23.5},"width":261.07,"height":58.76,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-3.png","element":"img","alt":"�1 − sm�M/p ≥","inline":true},{"style":{"height":23.51},"width":539.71,"height":58.76,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-4.png","element":"img","alt":"�1 − sm�N/p ≥�1 − sm� ms ≥ 0.3","inline":true},{"text":". Thus we obtain a bound of","element":"span"}],[{"style":{"width":"80%"},"width":1536,"height":412,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-5.png","element":"img"}],[{"text":"We show that when ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"= 1","element":"span"},{"text":", the bound ","element":"span"},{"style":{"height":26.63},"width":234.48,"height":66.57,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-6.png","element":"img","alt":" v = √ϵln( mϵp )p","inline":true,"padRight":true},{"text":"will produce ","element":"span"},{"style":{"height":19.18},"width":532.14,"height":47.95,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-7.png","element":"img","alt":" ∥R(v, . . . , v, 0, . . . , 0)∥p ≳ ω(ϵ)","inline":true},{"text":". 
At this ","element":"span"},{"style":{"fontStyle":"italic"},"text":"v ","element":"span"},{"text":"value, we know that:","element":"span"}],[{"style":{"width":"88%"},"width":1693,"height":326,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-8.png","element":"img"}]]},{"heading":"C Useful Moment Bounds","paragraphs":[[{"text":"The key quadratic form bound for Rademachers that we use is:","element":"span"}],[{"id":"id-46","style":{"fontWeight":"bold"},"text":"Lemma C.1 ","element":"span"},{"text":"Let ","element":"span"},{"style":{"fontStyle":"italic"},"text":"T ","element":"span"},{"text":"be an even integer, ","element":"span"},{"style":{"height":19.18},"width":172.86,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-9.png","element":"img","alt":" {σi}1≤i≤n","inline":true,"padRight":true},{"text":"be independent Rademachers, and ","element":"span"},{"style":{"height":16.79},"width":212.89,"height":41.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-10.png","element":"img","alt":" (Yi,j)1≤i,j≤n","inline":true,"padRight":true},{"text":"be a ","element":"span"},{"style":{"height":8},"width":95.15,"height":20,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-11.png","element":"img","alt":" n × n","inline":true,"padRight":true},{"text":"symmetric, nonnegative random matrix with zero diagonal (i.e. 
","element":"span"},{"style":{"height":15.59},"width":130.3,"height":38.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-12.png","element":"img","alt":" Yi,i = 0","inline":true},{"text":") such that ","element":"span"},{"style":{"height":19.76},"width":221.75,"height":49.4,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-13.png","element":"img","alt":" {Yi,j}1≤i,j≤n","inline":true,"padRight":true},{"text":"is independent from ","element":"span"},{"style":{"height":19.18},"width":172.86,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-14.png","element":"img","alt":" {σi}1≤i≤n","inline":true},{"text":". If ","element":"span"},{"style":{"height":28.8},"width":351.64,"height":72,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-15.png","element":"img","alt":" Wi =��1≤j≤n Y 2i,j","inline":true},{"text":", then:","element":"span"}],[{"style":{"width":"92%"},"width":1765,"height":148,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-16.png","element":"img"}],[{"text":"where ","element":"span"},{"style":{"fontStyle":"italic"},"text":"W","element":"span"},{"style":{"height":16.48},"width":218.41,"height":41.19,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-17.png","element":"img","alt":"(1) ≥ W(2) ≥","inline":true,"padRight":true},{"style":{"fontStyle":"italic"},"text":". . . ","element":"span"},{"style":{"height":12.8},"width":31,"height":32,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-18.png","element":"img","alt":" ≥","inline":true,"padRight":true},{"style":{"fontStyle":"italic"},"text":". . . 
W","element":"span"},{"style":{"height":11.2},"width":44.16,"height":28,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-19.png","element":"img","alt":"(n)","inline":true,"padRight":true},{"text":"is a permutation of ","element":"span"},{"style":{"fontStyle":"italic"},"text":"W","element":"span"},{"style":{"height":7.6},"width":16,"height":19,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-20.png","element":"img","alt":"1","inline":true},{"style":{"fontStyle":"italic"},"text":", . . . , W","element":"span"},{"style":{"height":4.8},"width":20,"height":12,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-21.png","element":"img","alt":"n","inline":true},{"text":".","element":"span"}],[{"text":"We derive Lemma ","element":"span"},{"href":"#id-46","text":"C.1 ","element":"a"},{"text":"from Latała’s bound on Rademacher quadratic forms ","element":"span"},{"href":"#id-32","referenceIndex":21,"text":"[21]","element":"a"},{"text":". In fact, Latała shows moment bounds for much more general quadratic forms, but for the application to JL, we only need the following bound in the special case of Rademachers:","element":"span"}],[{"id":"id-47","style":{"fontWeight":"bold"},"text":"Lemma C.2 (","element":"span"},{"href":"#id-32","referenceIndex":21,"style":{"fontWeight":"bold"},"text":"[21]","element":"a"},{"style":{"fontWeight":"bold"},"text":") ","element":"span"},{"text":"Let ","element":"span"},{"style":{"fontStyle":"italic"},"text":"T ","element":"span"},{"text":"be an even natural number. Let ","element":"span"},{"style":{"height":10},"width":171.97,"height":25,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-22.png","element":"img","alt":" σ1, . . . 
, σn","inline":true,"padRight":true},{"text":"be independent Rademachers and let ","element":"span"},{"style":{"height":16.79},"width":90.09,"height":41.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-23.png","element":"img","alt":"(ai,j)","inline":true,"padRight":true},{"text":"a symmetric matrix with zero diagonal. Then:","element":"span"}],[{"style":{"width":"90%"},"width":1722,"height":147,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-24.png","element":"img"}],[{"text":"where ","element":"span"},{"style":{"fontStyle":"italic"},"text":"A","element":"span"},{"style":{"height":28.8},"width":248.81,"height":72,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-25.png","element":"img","alt":"i =��1≤j≤n","inline":true,"padRight":true},{"style":{"fontStyle":"italic"},"text":"a","element":"span"},{"style":{"height":19.93},"width":33.72,"height":49.83,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-26.png","element":"img","alt":"2i,j","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"fontStyle":"italic"},"text":"A","element":"span"},{"style":{"height":17.28},"width":166.14,"height":43.2,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-27.png","element":"img","alt":"(1) ≥ A(2)","inline":true,"padRight":true},{"style":{"fontStyle":"italic"},"text":". . . ","element":"span"},{"style":{"height":12.8},"width":31,"height":32,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-28.png","element":"img","alt":" ≥","inline":true,"padRight":true},{"style":{"fontStyle":"italic"},"text":". . . 
A","element":"span"},{"style":{"height":11.2},"width":44.16,"height":28,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-29.png","element":"img","alt":"(n)","inline":true,"padRight":true},{"text":"is a permutation of ","element":"span"},{"style":{"fontStyle":"italic"},"text":"A","element":"span"},{"style":{"height":7.6},"width":16,"height":19,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-30.png","element":"img","alt":"1","inline":true},{"style":{"fontStyle":"italic"},"text":", . . . , A","element":"span"},{"style":{"height":4.8},"width":20,"height":12,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-31.png","element":"img","alt":"n","inline":true},{"text":".","element":"span"}],[{"text":"To prove Lemma ","element":"span"},{"href":"#id-46","style":{"fontStyle":"italic"},"text":"C.","element":"a"},{"text":"1","element":"span"},{"text":", we apply Lemma ","element":"span"},{"href":"#id-47","style":{"fontStyle":"italic"},"text":"C.","element":"a"},{"text":"2 ","element":"span"},{"text":"to the case where the ","element":"span"},{"style":{"height":11.59},"width":54.79,"height":28.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/13-32.png","element":"img","alt":" ai,j","inline":true,"padRight":true},{"text":"are themselves random variables:","element":"span"}],[{"style":{"width":"94%"},"width":1804,"height":657,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/14-0.png","element":"img"}],[{"text":"where the last line follows from the fact that the ","element":"span"},{"style":{"height":15.59},"width":56.86,"height":38.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/14-1.png","element":"img","alt":" Yi,j","inline":true,"padRight":true},{"text":"are nonnegative, so each term is nonnegative, so the triangle inequality results in at most a factor of ","element":"span"},{"text":"2 ","element":"span"},{"text":"of 
gain.","element":"span"}],[{"text":"Now, we consider linear forms of symmetric random variables. Theoretically, moments of these forms can be derived from Theorem 2 in ","element":"span"},{"href":"#id-33","referenceIndex":20,"text":"[20] ","element":"a"},{"text":"(a tight bound on moments of weighted sums of symmetric random variables). However, reducing the tight bound to the form that we want would require some simplifications. Instead, we give a direct proof of a weaker bound that is sufficiently tight for our setting.","element":"span"}],[{"id":"id-48","style":{"fontWeight":"bold"},"text":"Proposition C.3 ","element":"span"},{"text":"Suppose that ","element":"span"},{"style":{"height":13.2},"width":104.38,"height":33,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/14-2.png","element":"img","alt":" T ≥ 1","inline":true,"padRight":true},{"text":"is an integer. Suppose that ","element":"span"},{"style":{"height":14},"width":231.43,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/14-3.png","element":"img","alt":" Y1, Y2, . . . , Yn","inline":true,"padRight":true},{"text":"are i.i.d symmetric random variables and suppose that ","element":"span"},{"style":{"height":16},"width":271.66,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/14-4.png","element":"img","alt":" x = [x1, . . . , xn]","inline":true,"padRight":true},{"text":"satisfies ","element":"span"},{"style":{"height":16.78},"width":153.63,"height":41.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/14-5.png","element":"img","alt":" ∥x∥2 ≤ 1","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":16.78},"width":168.52,"height":41.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/14-6.png","element":"img","alt":" ∥x∥∞ ≤ v","inline":true},{"text":". 
Then, we have that","element":"span"}],[{"style":{"width":"42%"},"width":812,"height":124,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/14-7.png","element":"img"}],[{"style":{"fontStyle":"italic"},"text":"Proof of Proposition ","element":"span"},{"href":"#id-48","style":{"fontStyle":"italic"},"text":"C.","element":"a"},{"text":"3","element":"span"},{"style":{"fontStyle":"italic"},"text":". ","element":"span"},{"text":"Let ","element":"span"},{"style":{"height":28.8},"width":680.59,"height":72,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/14-8.png","element":"img","alt":" k = 2v�sup1≤t≤TTt� 1T v2�1/(2t) ∥Yi∥2t�","inline":true},{"text":". Observe that","element":"span"}],[{"style":{"width":"74%"},"width":1428,"height":573,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/14-9.png","element":"img"}],[{"text":"Now, we use the fact that ","element":"span"},{"style":{"height":16},"width":130.32,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/14-10.png","element":"img","alt":" |xi| ≤ v","inline":true,"padRight":true},{"text":"and the condition on ","element":"span"},{"style":{"fontStyle":"italic"},"text":"k ","element":"span"},{"text":"to obtain that this is bounded by","element":"span"}],[{"style":{"width":"89%"},"width":1704,"height":200,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/14-11.png","element":"img"}],[{"text":"We now bound moments of squares of linear forms with a zero diagonal, i.e. ","element":"span"},{"style":{"height":19.13},"width":249.38,"height":47.84,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/14-12.png","element":"img","alt":"�i̸=j YiYjxixj","inline":true},{"text":". This structure ","element":"span"},{"text":"of random variable theoretically falls under the scope of Lemma ","element":"span"},{"href":"#id-46","text":"C.1. 
","element":"a"},{"text":"However, as mentioned in Section 2.1, the first term of ","element":"span"},{"href":"#id-46","text":"C.1, ","element":"a"},{"text":"which is an operator-norm-like term for an asymmetric random matrix in this setting, becomes intractable to manage. We give an alternate (weaker) upper bound that is both tractable to analyze and sufficiently tight for our setting. Our proof of this bound is similar to our proof of Proposition ","element":"span"},{"href":"#id-48","text":"C.3 ","element":"a"},{"text":"presented above. Since random variables with a zero diagonal are common in the JL literature ","element":"span"},{"href":"#id-10","referenceIndex":19,"text":"[19, ","element":"a"},{"href":"#id-28","referenceIndex":3,"text":"3, ","element":"a"},{"href":"#id-29","referenceIndex":24,"text":"24]","element":"a"},{"text":", we believe this ","element":"span"},{"id":"id-49","text":"moment bound could be of broader use.","element":"span"}],[{"style":{"fontWeight":"bold"},"text":"Lemma C.4 ","element":"span"},{"text":"Suppose that ","element":"span"},{"style":{"height":14},"width":231.42,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/15-0.png","element":"img","alt":" Y1, Y2, . . . , Yn","inline":true,"padRight":true},{"text":"are i.i.d symmetric random variables and suppose that ","element":"span"},{"style":{"height":16},"width":271.65,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/15-1.png","element":"img","alt":" x = [x1, . . . 
, xn]","inline":true,"padRight":true},{"text":"satisfies ","element":"span"},{"style":{"height":16.78},"width":153.66,"height":41.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/15-2.png","element":"img","alt":" ∥x∥2 = 1","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":16.78},"width":168.52,"height":41.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/15-3.png","element":"img","alt":" ∥x∥∞ ≤ v","inline":true},{"text":". Let ","element":"span"},{"style":{"fontStyle":"italic"},"text":"T ","element":"span"},{"text":"be an even natural number. Then, we have that","element":"span"}],[{"style":{"width":"49%"},"width":953,"height":147,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/15-4.png","element":"img"}],[{"style":{"fontStyle":"italic"},"text":"Proof of Lemma ","element":"span"},{"href":"#id-49","style":{"fontStyle":"italic"},"text":"C.4. ","element":"a"},{"text":"Let ","element":"span"},{"style":{"height":28.8},"width":711.94,"height":72,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/15-5.png","element":"img","alt":" k = 2v�sup1≤t≤T/2Tt� 1T v2�1/(2t) ∥Yi∥2t�","inline":true},{"text":". 
Observe that","element":"span"}],[{"style":{"width":"83%"},"width":1593,"height":585,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/15-6.png","element":"img"}],[{"text":"Now, we use the fact that ","element":"span"},{"style":{"height":16},"width":130.32,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/15-7.png","element":"img","alt":" |xi| ≤ v","inline":true,"padRight":true},{"text":"and the condition on ","element":"span"},{"style":{"fontStyle":"italic"},"text":"k ","element":"span"},{"text":"to obtain that this is bounded by","element":"span"}],[{"style":{"width":"89%"},"width":1720,"height":215,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/15-8.png","element":"img"}],[{"text":"Latała ","element":"span"},{"href":"#id-33","referenceIndex":20,"text":"[20] ","element":"a"},{"text":"gives the following nice bound on sums of i.i.d symmetric random variables that we use for combining bounds on rows ","element":"span"},{"style":{"height":16},"width":250.02,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/15-9.png","element":"img","alt":" Zr(x1, . . . , xn)","inline":true,"padRight":true},{"text":"in Lemma ","element":"span"},{"href":"#id-36","text":"2.3.","element":"a"}],[{"id":"id-61","style":{"fontWeight":"bold"},"text":"Lemma C.5 (","element":"span"},{"href":"#id-33","referenceIndex":20,"style":{"fontWeight":"bold"},"text":"[20]","element":"a"},{"style":{"fontWeight":"bold"},"text":") ","element":"span"},{"text":"Suppose that ","element":"span"},{"style":{"fontStyle":"italic"},"text":"q ","element":"span"},{"text":"is an even natural number. Suppose that ","element":"span"},{"style":{"height":14},"width":172.7,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/15-10.png","element":"img","alt":" Y1, . . . , Yn","inline":true,"padRight":true},{"text":"are i.i.d symmetric random variables. 
Then:","element":"span"}],[{"style":{"width":"33%"},"width":639,"height":115,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/15-11.png","element":"img"}],[{"text":"We give a general lower bound on moments of certain (potentially correlated) sums of identically distributed random variables, that we use in proving Lemma ","element":"span"},{"href":"#id-37","text":"2.4.","element":"a"}],[{"id":"id-50","style":{"fontWeight":"bold"},"text":"Proposition C.6 ","element":"span"},{"text":"Let ","element":"span"},{"style":{"height":14},"width":172.71,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/15-12.png","element":"img","alt":" Y1, . . . , Yn","inline":true,"padRight":true},{"text":"be identically distributed (but not necessarily independent) random variables, such that the joint distribution is a symmetric function of ","element":"span"},{"style":{"height":14},"width":172.7,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/15-13.png","element":"img","alt":" Y1, . . . , Yn","inline":true,"padRight":true},{"text":"and for any integers ","element":"span"},{"style":{"height":14},"width":228.89,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/15-14.png","element":"img","alt":" d1, . . . dn ≥ 0","inline":true},{"text":", it is true that ","element":"span"},{"style":{"height":21.87},"width":327.98,"height":54.67,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/15-15.png","element":"img","alt":" E[�1≤i≤n Y dii ] ≥ 0","inline":true},{"text":". 
For any natural number ","element":"span"},{"style":{"fontStyle":"italic"},"text":"q ","element":"span"},{"text":"and natural number ","element":"span"},{"style":{"fontStyle":"italic"},"text":"T ","element":"span"},{"text":"that divides ","element":"span"},{"style":{"fontStyle":"italic"},"text":"q","element":"span"},{"text":", it is true that","element":"span"}],[{"style":{"width":"35%"},"width":685,"height":130,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/15-16.png","element":"img"}],[{"style":{"fontStyle":"italic"},"text":"Proof of Proposition ","element":"span"},{"href":"#id-50","style":{"fontStyle":"italic"},"text":"C.6. ","element":"a"},{"text":"The proof follows from expanding ","element":"span"},{"style":{"height":18.46},"width":235.96,"height":46.15,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/15-17.png","element":"img","alt":" E[(∑ni=1 Yi)q]","inline":true,"padRight":true},{"text":"and using the fact that ","element":"span"},{"style":{"height":21.87},"width":296.92,"height":54.67,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/15-18.png","element":"img","alt":" E[∏1≤i≤n Y dii ] ≥","inline":true,"padRight":true},{"text":"0 ","element":"span"},{"text":"so that we can restrict to a subset of the terms. By the symmetry of the joint distribution, for ","element":"span"},{"style":{"height":15.2},"width":386.66,"height":38,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/15-19.png","element":"img","alt":"1 ≤ r1 ≠ r2 ≠ rT ≤ n","inline":true},{"text":", we know that ","element":"span"},{"style":{"height":21.36},"width":630,"height":53.41,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/15-20.png","element":"img","alt":" E[Y q/Tr1 . . . Y q/TrT ] = E[Y q/T1 . . . Y q/TT ]","inline":true},{"text":". 
The number of terms of the form ","element":"span"},{"style":{"height":20.68},"width":286.48,"height":51.7,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/15-21.png","element":"img","alt":"E[Y q/Tr1 . . . Y q/TrT ]","inline":true,"padRight":true},{"text":"in ","element":"span"},{"style":{"height":18.46},"width":235.96,"height":46.15,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/15-22.png","element":"img","alt":" E[(�ni=1 Yi)q]","inline":true,"padRight":true},{"text":"is:","element":"span"}],[{"style":{"width":"94%"},"width":1813,"height":112,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/15-23.png","element":"img"}],[{"text":"This implies that","element":"span"}],[{"style":{"width":"44%"},"width":849,"height":116,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/16-0.png","element":"img"}],[{"text":"and the statement follows from taking ","element":"span"},{"text":"1","element":"span"},{"style":{"fontStyle":"italic"},"text":"/q","element":"span"},{"text":"th powers.","element":"span"}],[{"text":"We prove a lemma involving the Paley-Zygmund inequality applied to ","element":"span"},{"style":{"fontStyle":"italic"},"text":"p","element":"span"},{"text":"th moments, that we use implicitly in the proof of the upper bound in Theorem ","element":"span"},{"href":"#id-25","text":"1.5.","element":"a"}],[{"id":"id-51","style":{"fontWeight":"bold"},"text":"Lemma C.7 ","element":"span"},{"text":"Suppose that ","element":"span"},{"style":{"fontStyle":"italic"},"text":"K > ","element":"span"},{"text":"0 ","element":"span"},{"text":"and ","element":"span"},{"style":{"fontStyle":"italic"},"text":"Z ","element":"span"},{"text":"is a nonnegative random variable, such that ","element":"span"},{"style":{"height":19.18},"width":197.44,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/16-1.png","element":"img","alt":" ∥Z∥q ≥ 2K","inline":true,"padRight":true},{"text":"and 
","element":"span"},{"style":{"height":19.18},"width":100.79,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/16-2.png","element":"img","alt":" ∥Z∥2q","inline":true,"padRight":true},{"text":"is finite. Then,","element":"span"}],[{"style":{"width":"27%"},"width":521,"height":122,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/16-3.png","element":"img"}],[{"text":"We use the Paley-Zygmund inequality, which says the following:","element":"span"}],[{"id":"id-52","style":{"fontWeight":"bold"},"text":"Lemma C.8 (Paley-Zygmund) ","element":"span"},{"text":"Suppose that ","element":"span"},{"style":{"fontStyle":"italic"},"text":"Z ","element":"span"},{"text":"is a nonnegative random variable with finite variance. Then,","element":"span"}],[{"style":{"width":"23%"},"width":458,"height":97,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/16-4.png","element":"img"}],[{"style":{"fontStyle":"italic"},"text":"Proof of Lemma ","element":"span"},{"href":"#id-51","style":{"fontStyle":"italic"},"text":"C.","element":"a"},{"text":"7","element":"span"},{"style":{"fontStyle":"italic"},"text":". 
","element":"span"},{"text":"We apply Lemma ","element":"span"},{"href":"#id-52","style":{"fontStyle":"italic"},"text":"C.","element":"a"},{"text":"8 ","element":"span"},{"text":"to ","element":"span"},{"style":{"height":10.8},"width":47.06,"height":27,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/16-5.png","element":"img","alt":" Zp","inline":true,"padRight":true},{"text":"to obtain that:","element":"span"}],[{"style":{"width":"47%"},"width":913,"height":129,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/16-6.png","element":"img"}],[{"text":"If ","element":"span"},{"style":{"height":19.18},"width":197.38,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/16-7.png","element":"img","alt":" ∥Z∥p ≥ 2K","inline":true},{"text":", then we know that","element":"span"}],[{"style":{"width":"59%"},"width":1141,"height":45,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/16-8.png","element":"img"}],[{"text":"and then we can apply the above result.","element":"span"}]]},{"heading":"D Proofs of Lemma 2.1 and Lemma 2.2","paragraphs":[[{"text":"We analyze the moments of ","element":"span"},{"style":{"height":16},"width":250.02,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/16-9.png","element":"img","alt":" Zr(x1, . . . , xn)","inline":true},{"text":", proving Lemma ","element":"span"},{"href":"#id-35","text":"2.2 ","element":"a"},{"text":"and Lemma ","element":"span"},{"href":"#id-34","text":"2.1. ","element":"a"},{"text":"Our lower bound in Lemma ","element":"span"},{"href":"#id-35","text":"2.2 ","element":"a"},{"text":"holds for ","element":"span"},{"style":{"height":19.18},"width":391.36,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/16-10.png","element":"img","alt":" ∥Zr(v, . . . , v, 0, . . . 
, 0∥q","inline":true,"padRight":true},{"text":"as well as","element":"span"},{"style":{"height":30.6},"width":582.8,"height":76.49,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/16-11.png","element":"img","alt":"��Zr(v, . . . , v, 0, . . . , 0)I�1/v2i=1 ηr,i=2","inline":true}],[{"href":"#id-34","style":{"height":31.39},"width":45.14,"height":78.48,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/16-12.png","element":"img","alt":"��T","inline":true,"padRight":true},{"text":"(for technical reasons discussed ","element":"span"},{"text":"in Appendix ","element":"span"},{"text":"E)","element":"span"},{"text":". Our upper bound in Lemma ","element":"span"},{"href":"#id-34","text":"2.1 ","element":"a"},{"text":"holds for ","element":"span"},{"style":{"height":19.18},"width":304.37,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/16-13.png","element":"img","alt":" ∥Zr(x1, . . . , xn)∥q","inline":true},{"text":". In Appendix ","element":"span"},{"href":"#id-53","text":"D.1, ","element":"a"},{"text":"we prove Lemma ","element":"span"},{"href":"#id-35","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"2","element":"span"},{"text":". 
In Appendix ","element":"span"},{"href":"#id-54","text":"D.2, ","element":"a"},{"text":"we prove Lemma ","element":"span"},{"href":"#id-34","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"1","element":"span"},{"text":".","element":"span"}],[{"id":"id-53","style":{"fontWeight":"bold"},"text":"D.1 ","element":"span"},{"style":{"fontWeight":"bold"},"text":"Proof of Lemma ","element":"span"},{"href":"#id-35","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"2","element":"span"}],[{"text":"The key ingredient of the proof is Lemma ","element":"span"},{"href":"#id-46","style":{"fontStyle":"italic"},"text":"C.","element":"a"},{"text":"1 ","element":"span"},{"text":"(for Rademacher quadratic forms). We can view ","element":"span"},{"style":{"height":16},"width":352.52,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/16-14.png","element":"img","alt":" Zr(v, . . . , v, 0, . . . , 0)","inline":true,"padRight":true},{"text":"as the following quadratic form:","element":"span"}],[{"style":{"width":"44%"},"width":847,"height":92,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/16-15.png","element":"img"}],[{"text":"where ","element":"span"},{"style":{"height":19.37},"width":125.22,"height":48.43,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/16-16.png","element":"img","alt":" N = 1v2","inline":true,"padRight":true},{"text":". 
Since the support of ","element":"span"},{"style":{"height":11.59},"width":54.17,"height":28.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/16-17.png","element":"img","alt":" ηr,i","inline":true,"padRight":true},{"text":"is ","element":"span"},{"style":{"fontStyle":"italic"},"text":"{","element":"span"},{"text":"0","element":"span"},{"style":{"fontStyle":"italic"},"text":", ","element":"span"},{"text":"1","element":"span"},{"style":{"fontStyle":"italic"},"text":"} ","element":"span"},{"text":"and due to symmetry of this random variable, it is tractable ","element":"span"},{"text":"to analyze the expressions in Lemma ","element":"span"},{"href":"#id-46","style":{"fontStyle":"italic"},"text":"C.","element":"a"},{"text":"1","element":"span"},{"text":".","element":"span"}],[{"style":{"fontStyle":"italic"},"text":"Proof of Lemma ","element":"span"},{"href":"#id-35","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"2","element":"span"},{"style":{"fontStyle":"italic"},"text":". 
","element":"span"},{"text":"First, we handle the case of ","element":"span"},{"style":{"fontStyle":"italic"},"text":"T ","element":"span"},{"text":"= 2","element":"span"},{"text":":","element":"span"}],[{"style":{"width":"50%"},"width":975,"height":168,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/16-18.png","element":"img"}],[{"style":{"width":"56%"},"width":1077,"height":145,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/17-0.png","element":"img"}],[{"text":"as desired.","element":"span"}],[{"style":{"width":"105%"},"width":2009,"height":377,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/17-1.png","element":"img"}],[{"text":"is equal to","element":"span"}],[{"style":{"width":"93%"},"width":1793,"height":1677,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/17-2.png","element":"img"}],[{"text":"where the last line follows from the fact that since ","element":"span"},{"style":{"height":16.57},"width":145.96,"height":41.44,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/17-3.png","element":"img","alt":" T ≥ semv2","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":16},"width":145.73,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/17-4.png","element":"img","alt":" s ≤ m/e","inline":true},{"text":", we know that:","element":"span"}],[{"style":{"width":"61%"},"width":1174,"height":96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/17-5.png","element":"img"}],[{"text":"Setting ","element":"span"},{"style":{"fontStyle":"italic"},"text":"t ","element":"span"},{"text":"= ","element":"span"},{"style":{"fontStyle":"italic"},"text":"T/M","element":"span"},{"text":", we obtain, up to constants:","element":"span"}],[{"style":{"width":"64%"},"width":1234,"height":102,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-0.png","element":"img"}],[{"text":"We can take a 
derivative to obtain the two expressions in the lemma statement at the following regimes of parameters: ","element":"span"},{"style":{"height":17.38},"width":552.7,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-1.png","element":"img","alt":" max(1, Tv2) ≤ ln(Tmv2/s) ≤ T","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":17.38},"width":288.36,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-2.png","element":"img","alt":" ln(Tmv2/s) > T","inline":true},{"text":". The second regime aligns with the lemma statement. Thus it suffices to show that when ","element":"span"},{"style":{"height":12.8},"width":68.36,"height":32,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-3.png","element":"img","alt":" v ≤","inline":true}],[{"text":"straightforward calculation","element":"span"},{"href":"#id-55","style":{"height":7.6},"width":31.88,"height":19,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-4.png","element":"img","alt":"16","inline":true},{"text":".","element":"span"}],[{"style":{"width":"96%"},"width":1852,"height":62,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-5.png","element":"img"}],[{"text":"the above calculations, without taking the sum that we obtain a lower bound of","element":"span"}],[{"style":{"width":"71%"},"width":1374,"height":179,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-6.png","element":"img"}],[{"id":"id-54","style":{"fontWeight":"bold"},"text":"D.2 ","element":"span"},{"style":{"fontWeight":"bold"},"text":"Proof of Lemma ","element":"span"},{"href":"#id-34","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"1","element":"span"}],[{"text":"In Section 2.1, we discussed the tractability issues with using the general quadratic form moment bound Lemma 
","element":"span"},{"href":"#id-46","style":{"fontStyle":"italic"},"text":"C.","element":"a"},{"text":"1 ","element":"span"},{"text":"to upper bound ","element":"span"},{"style":{"height":19.18},"width":304.37,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-7.png","element":"img","alt":" ∥Zr(x1, . . . , xn)∥q","inline":true},{"text":". Thus, we require simpler bounds that are easier to analyze. Linear forms naturally arise in the upper bound since ","element":"span"},{"style":{"height":32.3},"width":990.56,"height":80.74,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-8.png","element":"img","alt":" Zr(x1, . . . , xn) =��1≤i≤n ηr,iσr,ixi�2−�1≤i≤n ηr,ix2i ≤","inline":true},{"style":{"height":32.3},"width":362.92,"height":80.74,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-9.png","element":"img","alt":"��1≤i≤n ηr,iσr,ixi�2","inline":true},{"text":". However, it turns out that a vanilla linear form bound (e.g. Proposition ","element":"span"},{"href":"#id-48","text":"C.3) ","element":"a"},{"text":"here is weak due to the loss arising from ignoring the ","element":"span"},{"style":{"height":20.57},"width":242.61,"height":51.42,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-10.png","element":"img","alt":"�1≤i≤n ηr,ix2i","inline":true,"padRight":true},{"text":"term. 
Thus, we use Lemma ","element":"span"},{"href":"#id-49","text":"C.4 ","element":"a"},{"text":"(our generalized ","element":"span"},{"text":"bound tailored to squares of linear forms with a zero diagonal) to obtain:","element":"span"}],[{"id":"id-58","style":{"fontWeight":"bold"},"text":"Lemma D.1 ","element":"span"},{"text":"If ","element":"span"},{"style":{"height":16.78},"width":168.52,"height":41.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-11.png","element":"img","alt":" ∥x∥∞ ≤ v","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":16.78},"width":153.64,"height":41.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-12.png","element":"img","alt":" ∥x∥2 ≤ 1","inline":true},{"text":", then we have that:","element":"span"}],[{"style":{"width":"72%"},"width":1394,"height":147,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-13.png","element":"img"}],[{"style":{"fontStyle":"italic"},"text":"Proof. ","element":"span"},{"text":"This can be seen by simply taking ","element":"span"},{"style":{"height":15.59},"width":203.14,"height":38.97,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-14.png","element":"img","alt":" Yi = ηr,iσr,i","inline":true,"padRight":true},{"text":"in Lemma ","element":"span"},{"href":"#id-49","style":{"fontStyle":"italic"},"text":"C.","element":"a"},{"text":"4","element":"span"},{"text":".","element":"span"}],[{"style":{"width":"96%"},"width":1851,"height":65,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-15.png","element":"img"}],[{"text":"on ","element":"span"},{"style":{"height":16},"width":192.23,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-16.png","element":"img","alt":" v(m, ϵ, δ, s)","inline":true,"padRight":true},{"text":"in Theorem ","element":"span"},{"href":"#id-25","text":"1.5. 
","element":"a"},{"text":"The lower bound on moments of ","element":"span"},{"style":{"height":16.78},"width":414.86,"height":41.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-17.png","element":"img","alt":" ∥Zr(v, . . . , v, 0, . . . , 0)∥T","inline":true,"padRight":true},{"text":"in Lemma ","element":"span"},{"href":"#id-35","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"2 ","element":"span"},{"text":"sheds light on where this loss may be arising. We see that the problematic case is when ","element":"span"},{"style":{"height":12.8},"width":63.4,"height":32,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-18.png","element":"img","alt":" v ≥","inline":true}],[{"text":"we require a new bound for this regime. Since the vector ","element":"span"},{"style":{"height":16},"width":331.13,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-19.png","element":"img","alt":" [v1, . . . , v1, 0, . . . , 0]","inline":true,"padRight":true},{"text":"is in ","element":"span"},{"style":{"height":13.19},"width":40.44,"height":32.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-20.png","element":"img","alt":" Sv","inline":true,"padRight":true},{"text":"when ","element":"span"},{"style":{"height":12.8},"width":114.21,"height":32,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-21.png","element":"img","alt":" v1 ≤ v","inline":true},{"text":", we can’t hope to beat the bound of ","element":"span"},{"style":{"height":27.95},"width":867.96,"height":69.88,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-22.png","element":"img","alt":" ||Zr(v1, . . . , v1, 0, . . . 
, 0)||T ≳ T 2v21ln2(T mv21/s) ≃ Tln(m/s)","inline":true,"padRight":true},{"text":"from Lemma ","element":"span"},{"href":"#id-35","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"2","element":"span"},{"text":". We show that ","element":"span"},{"text":"we can match this value:","element":"span"}],[{"id":"id-56","style":{"fontWeight":"bold"},"text":"Lemma D.2 ","element":"span"},{"text":"Suppose that ","element":"span"},{"style":{"height":16},"width":275.86,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-23.png","element":"img","alt":" x = [x1, . . . , xn]","inline":true,"padRight":true},{"text":"satisfies ","element":"span"},{"style":{"height":16.78},"width":157.83,"height":41.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-24.png","element":"img","alt":" ∥x∥2 = 1","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":16.78},"width":172.72,"height":41.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-25.png","element":"img","alt":" ∥x∥∞ < v","inline":true},{"text":". 
If ","element":"span"},{"style":{"height":17.5},"width":463.99,"height":43.75,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-26.png","element":"img","alt":" s ≤ m/e, T ≥ semv2 , T ≥ 3","inline":true},{"text":", ","element":"span"},{"style":{"height":17.38},"width":258.88,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-27.png","element":"img","alt":"T ≥ ln(mv2/s)","inline":true},{"text":", then:","element":"span"}],[{"style":{"width":"96%"},"width":1852,"height":251,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-28.png","element":"img"}],[{"text":"many smaller ","element":"span"},{"style":{"height":16},"width":58.11,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-29.png","element":"img","alt":" |xi|","inline":true,"padRight":true},{"text":"that are still allowed to be present. We separate out ","element":"span"},{"style":{"height":16},"width":102.82,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-30.png","element":"img","alt":" |xi| ≥","inline":true}],[{"text":"In the quadratic form formulation of ","element":"span"},{"style":{"height":16},"width":250.02,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-31.png","element":"img","alt":" Zr(x1, . . . 
, xn)","inline":true},{"text":", this separation cannot be carried out, since there would","element":"span"}],[{"id":"id-55","style":{"height":13.3},"width":202.75,"height":33.25,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-32.png","element":"img","alt":"16In fact, v =","inline":true},{"style":{"height":13.2},"width":131.72,"height":33,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-33.png","element":"img","alt":"√ln(m/s)","inline":true},{"style":{"height":10},"width":44.91,"height":25,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-34.png","element":"img","alt":"√T","inline":true,"padRight":true},{"text":"is very close to the value where ","element":"span"},{"style":{"height":14.1},"width":279.46,"height":35.25,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/18-35.png","element":"img","alt":" Tv2 = ln(Tmv2/s)","inline":true},{"text":", so this approximation is essentially tight.","element":"span"}],[{"style":{"width":"25%"},"width":489,"height":15,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/19-0.png","element":"img"}],[{"text":"be cross-terms between ","element":"span"},{"style":{"height":16},"width":104.3,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/19-1.png","element":"img","alt":" |xi| ≥","inline":true}],[{"style":{"width":"83%"},"width":1604,"height":72,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/19-2.png","element":"img"}],[{"style":{"fontStyle":"italic"},"text":"Proof of Lemma ","element":"span"},{"href":"#id-56","style":{"fontStyle":"italic"},"text":"D.","element":"a"},{"text":"2","element":"span"},{"style":{"fontStyle":"italic"},"text":". ","element":"span"},{"text":"WLOG, assume that ","element":"span"},{"style":{"height":16},"width":398.02,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/19-3.png","element":"img","alt":" |x1| ≥ |x2| ≥ . . . 
≥ |xn|","inline":true},{"text":". Let ","element":"span"},{"style":{"height":28.8},"width":247.03,"height":72,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/19-4.png","element":"img","alt":" P =� Tln(m/s)�","inline":true},{"text":". We know that","element":"span"}],[{"style":{"width":"55%"},"width":1063,"height":147,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/19-5.png","element":"img"}],[{"text":"For ","element":"span"},{"style":{"height":13.2},"width":170.92,"height":33,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/19-6.png","element":"img","alt":" 1 ≤ i ≤ P","inline":true},{"text":", we use the bound ","element":"span"},{"style":{"height":38.4},"width":865.53,"height":96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/19-7.png","element":"img","alt":" | �pi=1 ηr,iσr,ixi| ≤ �pi=1 |xi| ≤�� Tln(m/s)�≤ 2�","inline":true}],[{"text":"terms, we take ","element":"span"},{"style":{"height":15.59},"width":203.14,"height":38.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/19-8.png","element":"img","alt":" Yi = ηr,iσr,i","inline":true,"padRight":true},{"text":"in Proposition ","element":"span"},{"href":"#id-48","style":{"fontStyle":"italic"},"text":"C.","element":"a"},{"text":"3 ","element":"span"},{"text":"to obtain the following upper bound","element":"span"},{"href":"#id-57","style":{"height":7.6},"width":31.87,"height":19,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/19-9.png","element":"img","alt":"17","inline":true,"padRight":true},{"text":"for ","element":"span"},{"style":{"height":29.9},"width":356.16,"height":74.75,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/19-10.png","element":"img","alt":" |xi| ≤ v′ :=√ln(m/s)√T","inline":true,"padRight":true},{"text":"and 
","element":"span"},{"style":{"height":16.78},"width":153.64,"height":41.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/19-11.png","element":"img","alt":" ∥x∥2 ≤ 1","inline":true},{"text":":","element":"span"}],[{"style":{"width":"42%"},"width":819,"height":98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/19-12.png","element":"img"}],[{"text":"Based on the conditions in this lemma statement, we know that ","element":"span"},{"style":{"height":24.98},"width":622.6,"height":62.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/19-13.png","element":"img","alt":"mT v′2s = mT ln(m/s)sT = ms ln(m/s) ≥ e","inline":true},{"text":". Thus ","element":"span"},{"text":"taking a derivative, we obtain that this can be upper bounded by taking ","element":"span"},{"style":{"height":17.39},"width":282.46,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/19-14.png","element":"img","alt":" t = ln(mTv′2/s)","inline":true,"padRight":true},{"text":"which yields:","element":"span"}],[{"style":{"width":"80%"},"width":1541,"height":175,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/19-15.png","element":"img"}],[{"text":"Finally, combining Lemma ","element":"span"},{"href":"#id-58","style":{"fontStyle":"italic"},"text":"D.","element":"a"},{"text":"1 ","element":"span"},{"text":"and Lemma ","element":"span"},{"href":"#id-56","style":{"fontStyle":"italic"},"text":"D.","element":"a"},{"text":"2 ","element":"span"},{"text":"yields Lemma ","element":"span"},{"href":"#id-34","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"1","element":"span"},{"text":":","element":"span"}],[{"style":{"fontStyle":"italic"},"text":"Proof of Lemma ","element":"span"},{"href":"#id-34","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"1","element":"span"},{"style":{"fontStyle":"italic"},"text":". 
","element":"span"},{"text":"We apply Lemma ","element":"span"},{"href":"#id-58","style":{"fontStyle":"italic"},"text":"D.","element":"a"},{"text":"1 ","element":"span"},{"text":"at ","element":"span"},{"style":{"fontStyle":"italic"},"text":"T ","element":"span"},{"text":"= 2 ","element":"span"},{"text":"to directly obtain ","element":"span"},{"style":{"height":19.37},"width":38.13,"height":48.43,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/19-16.png","element":"img","alt":"T sm","inline":true,"padRight":true},{"text":", and for ","element":"span"},{"style":{"height":13.2},"width":101.95,"height":33,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/19-17.png","element":"img","alt":" T ≥ 3","inline":true},{"text":", we apply Lemma ","element":"span"},{"href":"#id-58","style":{"fontStyle":"italic"},"text":"D.","element":"a"},{"text":"1 ","element":"span"},{"text":"and take a derivative to obtain:","element":"span"}],[{"style":{"width":"73%"},"width":1404,"height":172,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/19-18.png","element":"img"}],[{"text":"To obtain the desired bound, we also include the bound from Lemma ","element":"span"},{"href":"#id-56","style":{"fontStyle":"italic"},"text":"D.","element":"a"},{"text":"2 ","element":"span"},{"text":"in the middle regime.","element":"span"}]]},{"heading":"E Combining rows to bound ∥R(x1, . . . , xn)∥q","paragraphs":[[{"text":"Now, we show to move from bounds on moments of individual rows (i.e. ","element":"span"},{"style":{"height":16},"width":250.03,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/19-19.png","element":"img","alt":" Zr(x1, . . . , xn)","inline":true},{"text":") to bounds on moments of ","element":"span"},{"style":{"height":16},"width":235.74,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/19-20.png","element":"img","alt":" R(x1, . . . , xn)","inline":true},{"text":". 
In Appendix ","element":"span"},{"href":"#id-59","text":"E.1, ","element":"a"},{"text":"we obtain an upper bound on ","element":"span"},{"style":{"height":19.18},"width":290.09,"height":47.95,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/19-21.png","element":"img","alt":" ∥R(x1, . . . , xn)∥q","inline":true},{"text":", thus proving Lemma ","element":"span"},{"href":"#id-36","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"3","element":"span"},{"text":". In Appendix ","element":"span"},{"href":"#id-60","text":"E.2, ","element":"a"},{"text":"we obtain a lower bound on ","element":"span"},{"style":{"height":19.18},"width":290.08,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/19-22.png","element":"img","alt":" ∥R(x1, . . . , xn)∥q","inline":true},{"text":", thus proving Lemma ","element":"span"},{"href":"#id-37","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"4","element":"span"},{"text":".","element":"span"}],[{"id":"id-59","style":{"fontWeight":"bold"},"text":"E.1 ","element":"span"},{"style":{"fontWeight":"bold"},"text":"Proof of Lemma ","element":"span"},{"text":"2","element":"span"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"href":"#id-36","text":"3","element":"a"}],[{"text":"Since the ","element":"span"},{"style":{"height":11.59},"width":54.16,"height":28.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/19-23.png","element":"img","alt":" ηr,i","inline":true,"padRight":true},{"text":"are negatively correlated, we can always upper bound the moments of ","element":"span"},{"style":{"height":16},"width":235.74,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/19-24.png","element":"img","alt":" R(x1, . . . 
, xn)","inline":true,"padRight":true},{"text":"by the case of a sum of ","element":"span"},{"style":{"fontStyle":"italic"},"text":"independent ","element":"span"},{"text":"random variables when ","element":"span"},{"style":{"fontStyle":"italic"},"text":"q ","element":"span"},{"text":"is even","element":"span"},{"style":{"height":17.38},"width":599.72,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/19-25.png","element":"img","alt":"18 Z′r(x1, . . . , xn) ∼ Zr(x1, . . . , xn)","inline":true},{"text":".","element":"span"}],[{"style":{"width":"61%"},"width":1167,"height":33,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/19-26.png","element":"img"}],[{"id":"id-62","style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"style":{"height":16},"width":124.69,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/19-27.png","element":"img","alt":" · ∥R(x1","inline":true},{"style":{"fontStyle":"italic"},"text":", . . . , x","element":"span"},{"style":{"height":19.18},"width":116.78,"height":47.95,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/19-28.png","element":"img","alt":"n)∥q ≤","inline":true}],[{"id":"id-57","style":{"width":"99%"},"width":1909,"height":85,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/19-29.png","element":"img"}],[{"text":"where the last inequality follows from Lemma ","element":"span"},{"href":"#id-61","style":{"fontStyle":"italic"},"text":"C.","element":"a"},{"text":"5","element":"span"},{"text":". Thus, it remains to analyze the ","element":"span"},{"text":"sup ","element":"span"},{"text":"expression. 
It turns out that each regime of bounds in Lemma ","element":"span"},{"href":"#id-34","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"1 ","element":"span"},{"text":"collapses to one value, so the different regimes in Lemma ","element":"span"},{"href":"#id-34","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"1 ","element":"span"},{"text":"correspond to different parts of the ","element":"span"},{"text":"max ","element":"span"},{"text":"expressions in Lemma ","element":"span"},{"href":"#id-36","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"3","element":"span"},{"text":". Depending on the parameters, some of these regimes may not exist, as is reflected by branches of the ","element":"span"},{"text":"max ","element":"span"},{"text":"expression sometimes vanishing in Lemma ","element":"span"},{"href":"#id-34","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"1","element":"span"},{"text":". We defer the computation to Appendix ","element":"span"},{"text":"F.","element":"span"}],[{"id":"id-60","style":{"fontWeight":"bold"},"text":"E.2 ","element":"span"},{"style":{"fontWeight":"bold"},"text":"Proof of Lemma ","element":"span"},{"text":"2","element":"span"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"href":"#id-37","text":"4","element":"a"}],[{"text":"Moving from a lower bound on the moments of individual rows given by Lemma ","element":"span"},{"href":"#id-35","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"2 ","element":"span"},{"text":"to moments of ","element":"span"},{"style":{"fontStyle":"italic"},"text":"R","element":"span"},{"text":"(","element":"span"},{"style":{"fontStyle":"italic"},"text":"v, . . . , v, ","element":"span"},{"text":"0","element":"span"},{"style":{"fontStyle":"italic"},"text":", . . . 
, ","element":"span"},{"text":"0) ","element":"span"},{"text":"is more delicate. Unlike in the upper bound, the negative correlations between random variables require some care to handle, even with the simplification that the ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"nonzero entries in a column are chosen uniformly at random. For example, the conditional distribution of ","element":"span"},{"style":{"height":16.79},"width":611.18,"height":41.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/20-0.png","element":"img","alt":" ηs+1,1 | η1,1 = η2,1 = . . . = ηs,1 = 1","inline":true,"padRight":true},{"text":"is ","element":"span"},{"text":"0","element":"span"},{"text":", while the marginal distribution of ","element":"span"},{"style":{"height":11.59},"width":100.64,"height":28.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/20-1.png","element":"img","alt":" ηs+1,1","inline":true,"padRight":true},{"text":"has expectation ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s/m","element":"span"},{"text":". One aspect that simplifies our analysis is that we ","element":"span"},{"style":{"fontStyle":"italic"},"text":"know ","element":"span"},{"text":"from our proof of Lemma ","element":"span"},{"href":"#id-36","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"3 ","element":"span"},{"text":"which moments of ","element":"span"},{"style":{"height":16},"width":250.03,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/20-2.png","element":"img","alt":" Zr(x1, . . . , xn)","inline":true,"padRight":true},{"text":"are critical in the ","element":"span"},{"text":"sup ","element":"span"},{"text":"expression in ","element":"span"},{"href":"#id-62","text":"(2)","element":"a"},{"text":". We only need to account for these particular moments in our lower bound approach. 
It turns out that the three critical values are ","element":"span"},{"style":{"fontStyle":"italic"},"text":"q/T ","element":"span"},{"text":"= 2","element":"span"},{"text":", ","element":"span"},{"style":{"fontStyle":"italic"},"text":"q/T ","element":"span"},{"text":"= ","element":"span"},{"style":{"fontStyle":"italic"},"text":"q","element":"span"},{"text":", and ","element":"span"},{"style":{"height":17.38},"width":335.12,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/20-3.png","element":"img","alt":" q/T = ln(qmv4/s2)","inline":true},{"text":".","element":"span"}],[{"text":"For ","element":"span"},{"style":{"fontStyle":"italic"},"text":"q/T ","element":"span"},{"text":"= ","element":"span"},{"style":{"fontStyle":"italic"},"text":"q","element":"span"},{"text":", where rows are isolated, we can directly obtain a bound from Lemma ","element":"span"},{"href":"#id-50","style":{"fontStyle":"italic"},"text":"C.","element":"a"},{"text":"6 ","element":"span"},{"text":"and Lemma ","element":"span"},{"href":"#id-35","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"2 ","element":"span"},{"text":"as follows.","element":"span"}],[{"id":"id-64","style":{"fontWeight":"bold"},"text":"Lemma E.1 ","element":"span"},{"text":"Suppose ","element":"span"},{"style":{"height":16.39},"width":114.05,"height":40.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/20-4.png","element":"img","alt":" As,m,n","inline":true,"padRight":true},{"text":"is a uniform sparse JL distribution. 
Suppose that ","element":"span"},{"style":{"fontStyle":"italic"},"text":"q ","element":"span"},{"text":"is even, ","element":"span"},{"style":{"height":17.5},"width":307.39,"height":43.74,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/20-5.png","element":"img","alt":" s ≤ m/e, q ≥ semv2","inline":true,"padRight":true},{"text":",","element":"span"}],[{"style":{"width":"74%"},"width":1419,"height":211,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/20-6.png","element":"img"}],[{"style":{"fontStyle":"italic"},"text":"Proof. ","element":"span"},{"text":"By Lemma ","element":"span"},{"href":"#id-50","style":{"fontStyle":"italic"},"text":"C.","element":"a"},{"text":"6 ","element":"span"},{"text":"with ","element":"span"},{"style":{"fontStyle":"italic"},"text":"T ","element":"span"},{"text":"= 1","element":"span"},{"text":", we have that:","element":"span"}],[{"style":{"width":"76%"},"width":1468,"height":90,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/20-7.png","element":"img"}],[{"text":"Now, we apply Lemma ","element":"span"},{"href":"#id-35","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"2 ","element":"span"},{"text":"to obtain the desired expression.","element":"span"}],[{"text":"For ","element":"span"},{"style":{"fontStyle":"italic"},"text":"q/T ","element":"span"},{"text":"= 2 ","element":"span"},{"text":"and ","element":"span"},{"style":{"height":17.38},"width":342.96,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/20-8.png","element":"img","alt":" q/T = ln(qmv4/s2)","inline":true},{"text":", we make use of the Lemma ","element":"span"},{"href":"#id-63","text":"E.2 ","element":"a"},{"text":"that relates moments of products of rows to products of moments of rows by taking advantage of either ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"and 
","element":"span"},{"style":{"height":19.37},"width":30.94,"height":48.43,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/20-9.png","element":"img","alt":"1v2","inline":true,"padRight":true},{"text":"being sufficiently large. The ","element":"span"},{"text":"method essentially uses a counting argument to show that not too many terms vanish as a result of negative correlations, and requires adding in an indicator for the number of nonzero entries in a row being ","element":"span"},{"text":"2 ","element":"span"},{"text":"for some cases (which is sufficient to prove Lemma ","element":"span"},{"href":"#id-37","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"4","element":"span"},{"text":").","element":"span"}],[{"id":"id-63","style":{"fontWeight":"bold"},"text":"Lemma E.2 ","element":"span"},{"text":"Suppose ","element":"span"},{"style":{"height":16.39},"width":114.06,"height":40.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/20-10.png","element":"img","alt":" As,m,n","inline":true,"padRight":true},{"text":"is a uniform sparse JL distribution. 
If ","element":"span"},{"style":{"height":16},"width":214.16,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/20-11.png","element":"img","alt":" 1 ≤ T ≤ q/2","inline":true,"padRight":true},{"text":"is an integer, ","element":"span"},{"style":{"fontStyle":"italic"},"text":"q/T ","element":"span"},{"text":"is an even integer, ","element":"span"},{"style":{"height":19.37},"width":30.94,"height":48.44,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/20-12.png","element":"img","alt":"1v2","inline":true,"padRight":true},{"text":"is an even integer, and ","element":"span"},{"style":{"height":15.79},"width":159.51,"height":39.47,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/20-13.png","element":"img","alt":" 2Tv2 ≤ s","inline":true},{"text":", then:","element":"span"}],[{"style":{"width":"81%"},"width":1565,"height":147,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/20-14.png","element":"img"}],[{"text":"We defer the proof to Appendix ","element":"span"},{"text":"G. ","element":"span"},{"text":"Now we can use Lemma ","element":"span"},{"href":"#id-50","style":{"fontStyle":"italic"},"text":"C.","element":"a"},{"text":"6 ","element":"span"},{"text":"coupled with Lemma ","element":"span"},{"href":"#id-63","style":{"fontStyle":"italic"},"text":"E.","element":"a"},{"text":"2 ","element":"span"},{"text":"and Lemma ","element":"span"},{"href":"#id-35","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"2 ","element":"span"},{"text":"to handle the cases of ","element":"span"},{"style":{"fontStyle":"italic"},"text":"q/T ","element":"span"},{"text":"= ","element":"span"},{"style":{"height":17.39},"width":251.66,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/20-15.png","element":"img","alt":"2, ln(qmv4/s2)","inline":true,"padRight":true},{"text":"and obtain the following bounds. 
For ","element":"span"},{"style":{"fontStyle":"italic"},"text":"q/T ","element":"span"},{"text":"= 2","element":"span"},{"text":", we obtain:","element":"span"}],[{"id":"id-65","style":{"fontWeight":"bold"},"text":"Lemma E.3 ","element":"span"},{"text":"Suppose ","element":"span"},{"style":{"height":16.39},"width":114.05,"height":40.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/20-16.png","element":"img","alt":" As,m,n","inline":true,"padRight":true},{"text":"is a uniform sparse JL distribution. If ","element":"span"},{"style":{"fontStyle":"italic"},"text":"q ","element":"span"},{"text":"is an even integer, ","element":"span"},{"style":{"height":23.02},"width":130,"height":57.54,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/20-17.png","element":"img","alt":"qv2s ≤ 1","inline":true},{"text":", and ","element":"span"},{"style":{"height":19.37},"width":30.95,"height":48.43,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/20-18.png","element":"img","alt":"1v2","inline":true,"padRight":true},{"text":"is ","element":"span"},{"text":"an even integer, then it is true that:","element":"span"}],[{"style":{"width":"86%"},"width":1652,"height":315,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/20-19.png","element":"img"}],[{"text":"Now, by Lemma ","element":"span"},{"href":"#id-35","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"2","element":"span"},{"text":", we can see that ","element":"span"},{"style":{"height":17.5},"width":495.89,"height":43.74,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/21-0.png","element":"img","alt":" ∥Z1(v, . . . , v, 0, . . . , 0)∥2 ≳ sm","inline":true},{"text":". 
Thus, our bound becomes:","element":"span"}],[{"style":{"width":"61%"},"width":1177,"height":178,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/21-1.png","element":"img"}],[{"text":"For ","element":"span"},{"style":{"height":17.38},"width":335.12,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/21-2.png","element":"img","alt":" q/T = ln(qmv4/s2)","inline":true},{"text":", we similarly obtain the following bound using Lemma ","element":"span"},{"href":"#id-50","style":{"fontStyle":"italic"},"text":"C.","element":"a"},{"text":"6 ","element":"span"},{"text":"coupled with Lemma ","element":"span"},{"href":"#id-63","style":{"fontStyle":"italic"},"text":"E.","element":"a"},{"text":"2","element":"span"},{"text":".","element":"span"}],[{"id":"id-66","style":{"fontWeight":"bold"},"text":"Lemma E.4 ","element":"span"},{"text":"Suppose ","element":"span"},{"style":{"height":16.39},"width":114.06,"height":40.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/21-3.png","element":"img","alt":" As,m,n","inline":true,"padRight":true},{"text":"is a uniform sparse JL distribution. 
Suppose that ","element":"span"},{"style":{"fontStyle":"italic"},"text":"q ","element":"span"},{"text":"is a power of ","element":"span"},{"style":{"height":16},"width":196.86,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/21-4.png","element":"img","alt":" 2, s ≤ m/e","inline":true},{"text":", ","element":"span"},{"style":{"height":19.37},"width":480.74,"height":48.44,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/21-5.png","element":"img","alt":"2qv2 ≤ 0.5s ln(qmv4/s2), 1v2","inline":true,"padRight":true},{"text":"is even, ","element":"span"},{"style":{"height":17.39},"width":358.71,"height":43.47,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/21-6.png","element":"img","alt":" 2 ≤ ln(qmv4/s2) ≤ q","inline":true},{"text":", and ","element":"span"},{"style":{"height":13.6},"width":107.12,"height":34,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/21-7.png","element":"img","alt":" m ≥ q","inline":true},{"text":". Then it is true that:","element":"span"}],[{"style":{"width":"33%"},"width":636,"height":109,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/21-8.png","element":"img"}],[{"style":{"fontStyle":"italic"},"text":"Proof. ","element":"span"},{"text":"Let’s let ","element":"span"},{"style":{"fontStyle":"italic"},"text":"f","element":"span"},{"text":"(","element":"span"},{"style":{"fontStyle":"italic"},"text":"x","element":"span"},{"text":") ","element":"span"},{"text":"be the function that rounds ","element":"span"},{"style":{"fontStyle":"italic"},"text":"x ","element":"span"},{"text":"to the nearest power of ","element":"span"},{"text":"2","element":"span"},{"text":". By the conditions, we know that ","element":"span"},{"style":{"height":17.38},"width":453.87,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/21-9.png","element":"img","alt":" 2 ≤ f(ln(qmv4/s2)) ≤ q","inline":true},{"text":". 
","element":"span"},{"text":"Now, we want the condition ","element":"span"},{"style":{"height":17.38},"width":438.59,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/21-10.png","element":"img","alt":" 2qv2 ≤ sf(ln(qmv4/s2))","inline":true,"padRight":true},{"text":"to be satisfied. ","element":"span"},{"text":"If ","element":"span"},{"style":{"height":17.38},"width":538.89,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/21-11.png","element":"img","alt":"f(ln(qmv4/s2)) ≥ ln(qmv4/s2)","inline":true},{"text":", then this is implied by ","element":"span"},{"style":{"height":17.38},"width":811.86,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/21-12.png","element":"img","alt":" 2qv2 ≤ s ln(qmv4/s2) = s max(ln(qmv4/s2), 2)","inline":true},{"text":", which is a strictly weaker condition than the one given in the lemma statement. If ","element":"span"},{"style":{"height":17.38},"width":540.2,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/21-13.png","element":"img","alt":" f(ln(qmv4/s2)) ≤ ln(qmv4/s2)","inline":true},{"text":", then ","element":"span"},{"style":{"height":17.39},"width":598.33,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/21-14.png","element":"img","alt":" f(ln(qmv4/s2)) ≥ 0.5 ln(qmv4/s2)","inline":true,"padRight":true},{"text":"and so ","element":"span"},{"style":{"height":17.39},"width":771.9,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/21-15.png","element":"img","alt":" 2qv2 ≤ 0.5s ln(qmv4/s2) ≤ sf(ln(qmv4/s2))","inline":true,"padRight":true},{"text":"gives the desired condition.","element":"span"}],[{"text":"We use the fact that ","element":"span"},{"style":{"height":17.38},"width":914.55,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/21-16.png","element":"img","alt":" ln(qmv4/s2)/2 ≤ f(ln(qmv4/s2)) ≤ 
2 ln(qmv4/s2)","inline":true},{"text":". ","element":"span"},{"text":"We apply Lemma ","element":"span"},{"href":"#id-63","text":"E.2 ","element":"a"},{"text":"and Lemma ","element":"span"},{"href":"#id-50","text":"C.6, ","element":"a"},{"text":"with ","element":"span"},{"style":{"height":20.21},"width":321.2,"height":50.52,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/21-17.png","element":"img","alt":" T = qf(ln(qmv4/s2))","inline":true,"padRight":true},{"text":"and Lemma ","element":"span"},{"href":"#id-35","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"2 ","element":"span"},{"text":"to see that if we have the additional condition that ","element":"span"},{"style":{"height":18.88},"width":385.45,"height":47.2,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/21-18.png","element":"img","alt":"f(ln(qmv4/s2)) ≥ semv2","inline":true,"padRight":true},{"text":", then we know that:","element":"span"}],[{"style":{"width":"99%"},"width":1910,"height":1030,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/21-19.png","element":"img"}],[{"text":"With these bounds, Lemma ","element":"span"},{"href":"#id-37","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"4 ","element":"span"},{"text":"follows.","element":"span"}],[{"style":{"fontStyle":"italic"},"text":"Proof of Lemma ","element":"span"},{"href":"#id-37","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"4","element":"span"},{"style":{"fontStyle":"italic"},"text":". 
","element":"span"},{"text":"We combine Lemma ","element":"span"},{"href":"#id-64","style":{"fontStyle":"italic"},"text":"E.","element":"a"},{"text":"1","element":"span"},{"text":", Lemma ","element":"span"},{"href":"#id-65","style":{"fontStyle":"italic"},"text":"E.","element":"a"},{"text":"3","element":"span"},{"text":", and Lemma ","element":"span"},{"href":"#id-66","style":{"fontStyle":"italic"},"text":"E.","element":"a"},{"text":"4","element":"span"},{"text":".","element":"span"}]]},{"heading":"F Proofs of Auxiliary Lemmas for Lemma 2.3","paragraphs":[[{"text":"First, we use Lemma ","element":"span"},{"href":"#id-61","style":{"fontStyle":"italic"},"text":"C.","element":"a"},{"text":"5 ","element":"span"},{"text":"and Lemma ","element":"span"},{"href":"#id-34","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"1 ","element":"span"},{"text":"to prove an upper bound on ","element":"span"},{"style":{"height":19.76},"width":286,"height":49.4,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/21-20.png","element":"img","alt":" ∥R(x1, . . . 
, xq)∥q","inline":true,"padRight":true},{"text":"that is not quite in the ","element":"span"},{"id":"id-67","text":"desired form for Lemma ","element":"span"},{"href":"#id-36","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"3","element":"span"},{"text":".","element":"span"}],[{"style":{"fontWeight":"bold"},"text":"Lemma F.1 ","element":"span"},{"text":"Let ","element":"span"},{"style":{"height":14},"width":180.42,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/22-0.png","element":"img","alt":" 2 ≤ q ≤ m","inline":true,"padRight":true},{"text":"be an even integer and ","element":"span"},{"style":{"height":16},"width":130.31,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/22-1.png","element":"img","alt":" |xi| ≤ v","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":16.78},"width":153.66,"height":41.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/22-2.png","element":"img","alt":" ∥x∥2 = 1","inline":true},{"text":". 
If ","element":"span"},{"style":{"height":16.57},"width":137.68,"height":41.43,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/22-3.png","element":"img","alt":"semv2 ≥ q","inline":true},{"text":", then:","element":"span"}],[{"style":{"width":"29%"},"width":570,"height":48,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/22-4.png","element":"img"}],[{"text":"If ","element":"span"},{"style":{"height":17.38},"width":267.79,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/22-5.png","element":"img","alt":" ln(qmv2/s) > q","inline":true,"padRight":true},{"text":"then we have","element":"span"}],[{"style":{"width":"47%"},"width":914,"height":48,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/22-6.png","element":"img"}],[{"text":"In all other cases, we have that","element":"span"}],[{"style":{"width":"77%"},"width":1490,"height":48,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/22-7.png","element":"img"}],[{"text":"The functions are defined as follows.","element":"span"}],[{"style":{"width":"65%"},"width":1261,"height":535,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/22-8.png","element":"img"}],[{"style":{"fontStyle":"italic"},"text":"Proof of Lemma ","element":"span"},{"href":"#id-67","style":{"fontStyle":"italic"},"text":"F.","element":"a"},{"text":"1","element":"span"},{"style":{"fontStyle":"italic"},"text":". ","element":"span"},{"text":"As we discussed in Appendix ","element":"span"},{"text":"E, ","element":"span"},{"text":"it suffices to bound","element":"span"}],[{"style":{"width":"34%"},"width":663,"height":108,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/22-9.png","element":"img"}],[{"text":"Our bounds on ","element":"span"},{"style":{"height":16.78},"width":301.6,"height":41.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/22-10.png","element":"img","alt":" ∥Z1(x1, . . . 
, xn)∥t","inline":true,"padRight":true},{"text":"are based on Lemma ","element":"span"},{"href":"#id-34","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"1","element":"span"},{"text":". We split into cases based on the ","element":"span"},{"style":{"fontStyle":"italic"},"text":"T ","element":"span"},{"text":"value, and how it separates into different cases in Lemma ","element":"span"},{"href":"#id-34","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"1","element":"span"},{"text":". Let","element":"span"}],[{"style":{"width":"99%"},"width":1912,"height":714,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/22-11.png","element":"img"}],[{"text":"Let’s first consider ","element":"span"},{"style":{"height":16.57},"width":137.69,"height":41.43,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/22-12.png","element":"img","alt":"semv2 ≥ q","inline":true},{"text":". In this case, only the ","element":"span"},{"style":{"height":14.4},"width":38.54,"height":36,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/22-13.png","element":"img","alt":" β1","inline":true,"padRight":true},{"text":"branch arises. Now, suppose that ","element":"span"},{"style":{"height":16.57},"width":137.71,"height":41.43,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/22-14.png","element":"img","alt":"semv2 < q","inline":true},{"text":". ","element":"span"},{"text":"Suppose that ","element":"span"},{"style":{"height":17.38},"width":271.47,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/22-15.png","element":"img","alt":" ln(qmv2/s) > q","inline":true},{"text":". 
Then we show that the ","element":"span"},{"style":{"height":14.4},"width":54.44,"height":36,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/22-16.png","element":"img","alt":" β34","inline":true,"padRight":true},{"text":"branch does not arise. It suffices to show that ","element":"span"},{"style":{"height":17.38},"width":288.06,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/22-17.png","element":"img","alt":"ln(Tmv2/s) > T","inline":true,"padRight":true},{"text":"for all ","element":"span"},{"style":{"height":16.57},"width":146.64,"height":41.44,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/22-18.png","element":"img","alt":" T ≥ semv2","inline":true,"padRight":true},{"text":". Let ","element":"span"},{"style":{"height":17.38},"width":217.94,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/22-19.png","element":"img","alt":" x = Tmv2/s","inline":true},{"text":". It suffices to show that ","element":"span"},{"style":{"height":16.57},"width":199.07,"height":41.44,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/22-20.png","element":"img","alt":"smv2 xln x < 1","inline":true,"padRight":true},{"text":"for all ","element":"span"},{"style":{"height":23.02},"width":228.56,"height":57.55,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/22-21.png","element":"img","alt":" e ≤ x ≤ qmv2s","inline":true,"padRight":true},{"text":".","element":"span"}],[{"text":"Since ","element":"span"},{"style":{"height":16.57},"width":198.39,"height":41.43,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/22-22.png","element":"img","alt":"smv2 xln x < 1","inline":true,"padRight":true},{"text":"at ","element":"span"},{"style":{"height":23.02},"width":155.52,"height":57.54,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/22-23.png","element":"img","alt":" x = 
qmv2s","inline":true,"padRight":true},{"text":"and this is an increasing function of ","element":"span"},{"style":{"fontStyle":"italic"},"text":"x","element":"span"},{"text":", we know that the condition is true. We now produce bounds ","element":"span"},{"style":{"height":16},"width":531.32,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/22-24.png","element":"img","alt":" α1(q, v, s, m), . . . , α4(q, v, s, m)","inline":true,"padRight":true},{"text":"such that ","element":"span"},{"style":{"height":16},"width":481.84,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/22-25.png","element":"img","alt":" βi(q, v, s, m) ≲ αi(q, v, s, m)","inline":true},{"text":", which is what we do for the remainder of the analysis.","element":"span"}],[{"text":"First, we handle the ","element":"span"},{"style":{"height":16},"width":218.68,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/23-0.png","element":"img","alt":" β1(q, v, s, m)","inline":true,"padRight":true},{"text":"term. We see that","element":"span"}],[{"style":{"width":"74%"},"width":1430,"height":118,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/23-1.png","element":"img"}],[{"text":"Now, we handle the ","element":"span"},{"style":{"height":16},"width":218.68,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/23-2.png","element":"img","alt":" β2(q, v, s, m)","inline":true,"padRight":true},{"text":"term. We obtain a bound for ","element":"span"},{"style":{"height":23.5},"width":402.84,"height":58.76,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/23-3.png","element":"img","alt":" ∥Zr∥T ≲ v2 ( smT v2)2/T","inline":true,"padRight":true},{"text":". 
The expression becomes:","element":"span"}],[{"style":{"width":"63%"},"width":1214,"height":396,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/23-4.png","element":"img"}],[{"text":"Suppose that ","element":"span"},{"style":{"height":17.39},"width":286.66,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/23-5.png","element":"img","alt":" ln(qmv4/s2) ≥ 2","inline":true},{"text":". In this case, we have that this expression is upper bounded by ","element":"span"},{"style":{"height":17.39},"width":295.97,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/23-6.png","element":"img","alt":" T = ln(qmv4/s2)","inline":true},{"text":". When we plug this into the expression, we obtain ","element":"span"},{"style":{"height":25.82},"width":194.86,"height":64.54,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/23-7.png","element":"img","alt":"qv2s ln(qmv4/s2)","inline":true},{"text":". ","element":"span"},{"text":"Otherwise, if ","element":"span"},{"style":{"height":17.39},"width":303.32,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/23-8.png","element":"img","alt":" ln(qmv4/s2) ≤ 2","inline":true},{"text":", then this expression is upper bounded by ","element":"span"},{"style":{"fontStyle":"italic"},"text":"T ","element":"span"},{"text":"= 3","element":"span"},{"text":":","element":"span"}],[{"style":{"width":"30%"},"width":585,"height":109,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/23-9.png","element":"img"}],[{"text":"We know that ","element":"span"},{"style":{"height":26.78},"width":247.76,"height":66.94,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/23-10.png","element":"img","alt":"q2/3v2/3s1/3m1/3 ≤ √q√m","inline":true,"padRight":true},{"text":"because this reduces 
to","element":"span"}],[{"style":{"width":"32%"},"width":625,"height":109,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/23-11.png","element":"img"}],[{"text":"Now, we handle the ","element":"span"},{"style":{"height":16},"width":218.68,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/23-12.png","element":"img","alt":" β4(q, v, s, m)","inline":true,"padRight":true},{"text":"term when ","element":"span"},{"style":{"height":17.38},"width":267.78,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/23-13.png","element":"img","alt":" ln(qmv2/s) ≤ q","inline":true},{"text":".","element":"span"}],[{"style":{"width":"63%"},"width":1223,"height":396,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/23-14.png","element":"img"}],[{"text":"If ","element":"span"},{"style":{"height":16.58},"width":128.4,"height":41.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/23-15.png","element":"img","alt":" s ≤ qv2","inline":true},{"text":", this is bounded by ","element":"span"},{"text":"1","element":"span"},{"text":", and if ","element":"span"},{"style":{"height":16.58},"width":128.41,"height":41.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/23-16.png","element":"img","alt":" s ≥ qv2","inline":true},{"text":", this is bounded by ","element":"span"},{"style":{"height":35.11},"width":286.14,"height":87.77,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/23-17.png","element":"img","alt":"( sqv2)1/ ln(mv2/s)","inline":true},{"text":". 
We see that ","element":"span"},{"style":{"height":24.58},"width":170.64,"height":61.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/23-18.png","element":"img","alt":"sqv2 ≤ mv2s","inline":true,"padRight":true},{"text":",","element":"span"}],[{"style":{"width":"72%"},"width":1377,"height":77,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/23-19.png","element":"img"}],[{"text":"Now, we handle the ","element":"span"},{"style":{"height":16},"width":218.68,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/23-20.png","element":"img","alt":" β3(q, v, s, m)","inline":true,"padRight":true},{"text":"term. In this case, the expression becomes:","element":"span"}],[{"style":{"width":"84%"},"width":1618,"height":459,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/23-21.png","element":"img"}],[{"text":"We use some function bounding arguments to come up with a simpler bound for ","element":"span"},{"style":{"height":9.19},"width":41.49,"height":22.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/24-0.png","element":"img","alt":" α3","inline":true,"padRight":true},{"text":"for sufficiently large ","element":"span"},{"style":{"fontStyle":"italic"},"text":"v","element":"span"},{"text":".","element":"span"}],[{"id":"id-68","style":{"fontWeight":"bold"},"text":"Lemma F.2 ","element":"span"},{"text":"Assume that ","element":"span"},{"style":{"height":16.59},"width":244.88,"height":41.47,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/24-1.png","element":"img","alt":" C2q3mv4 ≥ s2","inline":true,"padRight":true},{"text":"for some ","element":"span"},{"style":{"height":13.2},"width":119.49,"height":33,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/24-2.png","element":"img","alt":" C2 ≥ 1","inline":true},{"text":". 
Then it is true that","element":"span"}],[{"style":{"width":"63%"},"width":1213,"height":118,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/24-3.png","element":"img"}],[{"style":{"fontStyle":"italic"},"text":"Proof of Lemma ","element":"span"},{"href":"#id-68","style":{"fontStyle":"italic"},"text":"F.","element":"a"},{"text":"2","element":"span"},{"style":{"fontStyle":"italic"},"text":". ","element":"span"},{"text":"With the assumptions that we made we know that ","element":"span"},{"style":{"height":26.1},"width":225.93,"height":65.25,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/24-4.png","element":"img","alt":"sq3v2C22 ≤ mv2s","inline":true,"padRight":true},{"text":". This implies that our ","element":"span"},{"text":"expression becomes:","element":"span"}],[{"style":{"width":"84%"},"width":1609,"height":550,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/24-5.png","element":"img"}],[{"text":"Let ","element":"span"},{"style":{"height":13.19},"width":82.84,"height":32.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/24-6.png","element":"img","alt":" Tmin","inline":true,"padRight":true},{"text":"be the minimum ","element":"span"},{"style":{"fontStyle":"italic"},"text":"T ","element":"span"},{"text":"such that ","element":"span"},{"style":{"height":18.88},"width":517.45,"height":47.2,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/24-7.png","element":"img","alt":" T ≥ max( semv2 , 3, ln(mv2T/s))","inline":true},{"text":". We just need to bound","element":"span"}],[{"style":{"width":"84%"},"width":1622,"height":256,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/24-8.png","element":"img"}],[{"text":"First, we handle the second term. 
Let ","element":"span"},{"style":{"height":22.18},"width":173.19,"height":55.45,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/24-9.png","element":"img","alt":" Q = mv2Ts","inline":true,"padRight":true},{"text":". We use that ","element":"span"},{"style":{"height":16.57},"width":201.67,"height":41.43,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/24-10.png","element":"img","alt":" Tmin ≥ semv2","inline":true,"padRight":true},{"text":", so ","element":"span"},{"style":{"height":22.44},"width":211.15,"height":56.1,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/24-11.png","element":"img","alt":" mv2Tmins ≥ e","inline":true,"padRight":true},{"text":"to conclude ","element":"span"},{"style":{"height":14},"width":103.64,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/24-12.png","element":"img","alt":" Q ≥ e","inline":true},{"text":". We see that","element":"span"}],[{"style":{"width":"55%"},"width":1069,"height":97,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/24-13.png","element":"img"}],[{"text":"We see that setting ","element":"span"},{"style":{"fontStyle":"italic"},"text":"Q ","element":"span"},{"text":"to its maximum value achieves within a factor of ","element":"span"},{"style":{"fontStyle":"italic"},"text":"e ","element":"span"},{"text":"of the maximum value of ","element":"span"},{"style":{"height":23.43},"width":91.73,"height":58.56,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/24-14.png","element":"img","alt":"Qln2(Q)","inline":true},{"text":". ","element":"span"},{"text":"Thus, we obtain that this is upper bounded by ","element":"span"},{"style":{"height":22.1},"width":215.59,"height":55.26,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/24-15.png","element":"img","alt":" e3 qln2(mv2q/s)","inline":true},{"text":".","element":"span"}],[{"text":"Now, we just need to handle the first term. 
If ","element":"span"},{"style":{"height":14},"width":196.52,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/24-16.png","element":"img","alt":" Tmin ≥ ln q","inline":true},{"text":", then this term doesn’t exist. Let’s take a log of the expression to obtain:","element":"span"}],[{"style":{"width":"75%"},"width":1440,"height":261,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/24-17.png","element":"img"}],[{"text":"The sign of the derivative is the same as:","element":"span"}],[{"style":{"width":"22%"},"width":431,"height":93,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/24-18.png","element":"img"}],[{"text":"Since ","element":"span"},{"style":{"height":16.57},"width":207.86,"height":41.43,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/24-19.png","element":"img","alt":" Tmin ≥ semv2","inline":true,"padRight":true},{"text":", we know that ","element":"span"},{"style":{"height":17.38},"width":283.46,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/24-20.png","element":"img","alt":" ln(mv2T/s) ≥ 0","inline":true},{"text":". Thus, we know that ","element":"span"},{"style":{"height":22.17},"width":325.93,"height":55.43,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/24-21.png","element":"img","alt":" 1 − 2ln(mv2T/s) ≤ 1","inline":true},{"text":". 
Since ","element":"span"},{"style":{"height":14},"width":147,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/24-22.png","element":"img","alt":" T ≤ ln q","inline":true},{"text":", ","element":"span"},{"text":"we know that ","element":"span"},{"style":{"height":20.21},"width":129.12,"height":50.52,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/24-23.png","element":"img","alt":"ln qT ≥ 1","inline":true},{"text":", so ","element":"span"},{"style":{"height":20.21},"width":217.21,"height":50.52,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/24-24.png","element":"img","alt":" − 2 ln qT ≤ −2","inline":true},{"text":". Thus, the derivative is negative, so the ","element":"span"},{"text":"sup ","element":"span"},{"text":"is attained at ","element":"span"},{"style":{"height":13.19},"width":170.2,"height":32.97,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/24-25.png","element":"img","alt":" Tmin = T","inline":true},{"text":", where the expression is:","element":"span"}],[{"style":{"width":"56%"},"width":1088,"height":104,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/24-26.png","element":"img"}],[{"text":"Thus, to upper bound by ","element":"span"},{"style":{"height":20.63},"width":174.38,"height":51.56,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/25-0.png","element":"img","alt":"qln2(mv2q/s)","inline":true},{"text":", it suffices to show:","element":"span"}],[{"style":{"width":"99%"},"width":1910,"height":626,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/25-1.png","element":"img"}],[{"text":"Now, we combine Lemma ","element":"span"},{"href":"#id-67","style":{"fontStyle":"italic"},"text":"F.","element":"a"},{"text":"1 ","element":"span"},{"text":"and Lemma ","element":"span"},{"href":"#id-68","style":{"fontStyle":"italic"},"text":"F.","element":"a"},{"text":"2 ","element":"span"},{"text":"to prove Lemma 
","element":"span"},{"href":"#id-36","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"3","element":"span"},{"text":".","element":"span"}],[{"style":{"fontStyle":"italic"},"text":"Proof of Lemma ","element":"span"},{"href":"#id-36","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"3","element":"span"},{"style":{"fontStyle":"italic"},"text":". ","element":"span"},{"text":"First, we compute the second moment by hand:","element":"span"}],[{"style":{"width":"52%"},"width":1006,"height":569,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/25-2.png","element":"img"}],[{"text":"For ","element":"span"},{"style":{"height":14},"width":182.42,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/25-3.png","element":"img","alt":" 2 < q ≤ m","inline":true},{"text":", we apply Lemma ","element":"span"},{"href":"#id-67","style":{"fontStyle":"italic"},"text":"F.","element":"a"},{"text":"1 ","element":"span"},{"text":"and Lemma ","element":"span"},{"href":"#id-68","style":{"fontStyle":"italic"},"text":"F.","element":"a"},{"text":"2","element":"span"},{"text":". We only include ","element":"span"},{"style":{"height":9.19},"width":41.49,"height":22.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/25-4.png","element":"img","alt":" α4","inline":true,"padRight":true},{"text":"when ","element":"span"},{"style":{"height":17.38},"width":287.66,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/25-5.png","element":"img","alt":" ln(qmv4/s2) ≥ 2","inline":true,"padRight":true},{"text":"to simplify the bound. 
The bound follows.","element":"span"}]]},{"heading":"G Proof of Auxiliary Lemma for Lemma 2.4","paragraphs":[[{"text":"We prove Lemma ","element":"span"},{"href":"#id-63","style":{"fontStyle":"italic"},"text":"E.","element":"a"},{"text":"2","element":"span"},{"text":".","element":"span"}],[{"style":{"fontStyle":"italic"},"text":"Proof of Lemma ","element":"span"},{"href":"#id-63","style":{"fontStyle":"italic"},"text":"E.","element":"a"},{"text":"2","element":"span"},{"style":{"fontStyle":"italic"},"text":". ","element":"span"},{"text":"First, we show the following fact: Suppose that there are ","element":"span"},{"style":{"fontStyle":"italic"},"text":"T ","element":"span"},{"text":"distinguishable buckets and we want to assign an ordered pair of ","element":"span"},{"text":"2 ","element":"span"},{"text":"unequal elements in ","element":"span"},{"text":"[","element":"span"},{"style":{"fontStyle":"italic"},"text":"N","element":"span"},{"text":"] ","element":"span"},{"text":"to each bucket so that the total number of times that any element ","element":"span"},{"style":{"height":16},"width":129.74,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/25-6.png","element":"img","alt":" i ∈ [N]","inline":true,"padRight":true},{"text":"shows up is ","element":"span"},{"style":{"height":12.8},"width":65.5,"height":32,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/25-7.png","element":"img","alt":" ≤ s","inline":true},{"text":". We show that the number of such assignments is at least ","element":"span"},{"style":{"height":13.38},"width":131.69,"height":33.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/25-8.png","element":"img","alt":"CT N 2T","inline":true,"padRight":true},{"text":"for some constant ","element":"span"},{"style":{"fontStyle":"italic"},"text":"C","element":"span"},{"text":". 
To prove this, we first consider the case where ","element":"span"},{"style":{"height":13.2},"width":143.06,"height":33,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/25-9.png","element":"img","alt":" N ≥ 2T","inline":true},{"text":". In this case, we have that the number of such assignments is at least:","element":"span"}],[{"style":{"width":"42%"},"width":811,"height":45,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/25-10.png","element":"img"}],[{"text":"Now, if ","element":"span"},{"style":{"fontStyle":"italic"},"text":"N < ","element":"span"},{"text":"2","element":"span"},{"style":{"fontStyle":"italic"},"text":"T","element":"span"},{"text":", then we define:","element":"span"}],[{"style":{"width":"23%"},"width":440,"height":90,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/25-11.png","element":"img"}],[{"text":"We partition ","element":"span"},{"text":"2","element":"span"},{"style":{"fontStyle":"italic"},"text":"T ","element":"span"},{"text":"into ","element":"span"},{"style":{"height":14.4},"width":23,"height":36,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/25-12.png","element":"img","alt":" β","inline":true,"padRight":true},{"text":"blocks, each of size ","element":"span"},{"style":{"fontStyle":"italic"},"text":"N","element":"span"},{"text":", until potentially the last block, which may be smaller. We can read off ordered pairs assigned to each bucket from this formulation. Let’s assume that each block is a permutation of ","element":"span"},{"text":"1","element":"span"},{"style":{"fontStyle":"italic"},"text":", . . . 
, N","element":"span"},{"text":", and the last block is ","element":"span"},{"style":{"height":16},"width":285.31,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/25-13.png","element":"img","alt":" 2T − (β − 1)(N)","inline":true,"padRight":true},{"text":"non-equal numbers drawn from ","element":"span"},{"text":"1","element":"span"},{"style":{"fontStyle":"italic"},"text":", . . . , N","element":"span"},{"text":". (this satisfies the unequal ordered pair condition). Then the number of assignments is ","element":"span"},{"style":{"height":17.78},"width":508.97,"height":44.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/25-14.png","element":"img","alt":" (N!)β−1 ·(N)(N −1) . . . (N −","inline":true},{"style":{"height":16},"width":404.71,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/25-15.png","element":"img","alt":"(2T − (β − 1)(N)) + 1)","inline":true},{"text":". This is at least as big as ","element":"span"},{"style":{"height":17.34},"width":147.57,"height":43.36,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/25-16.png","element":"img","alt":" C2T1 N 2T","inline":true,"padRight":true},{"text":"for some constant ","element":"span"},{"style":{"height":13.19},"width":44.48,"height":32.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/25-17.png","element":"img","alt":" C1","inline":true},{"text":".","element":"span"}],[{"style":{"width":"96%"},"width":1851,"height":41,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/26-0.png","element":"img"}],[{"style":{"height":13.2},"width":167.97,"height":33,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/26-1.png","element":"img","alt":"1 ≤ x ≤ s","inline":true},{"text":":","element":"span"}],[{"style":{"width":"53%"},"width":1029,"height":74,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/26-2.png","element":"img"}],[{"text":"We know 
that","element":"span"}],[{"style":{"width":"24%"},"width":475,"height":130,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/26-3.png","element":"img"}],[{"text":"where ","element":"span"},{"style":{"height":13.19},"width":38.14,"height":32.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/26-4.png","element":"img","alt":" Yr","inline":true,"padRight":true},{"text":"has expectation ","element":"span"},{"text":"0","element":"span"},{"text":". In this case we have that","element":"span"}],[{"style":{"width":"45%"},"width":869,"height":145,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/26-5.png","element":"img"}],[{"text":"where ","element":"span"},{"style":{"fontStyle":"italic"},"text":"Q ","element":"span"},{"text":"consists of terms that contain a factor of some ","element":"span"},{"style":{"height":13.19},"width":38.14,"height":32.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/26-6.png","element":"img","alt":" Yr","inline":true},{"text":". 
Due to the independence of the Rademachers, any term that contains a factor of ","element":"span"},{"style":{"height":13.19},"width":38.14,"height":32.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/26-7.png","element":"img","alt":" Yr","inline":true,"padRight":true},{"text":"has expectation ","element":"span"},{"text":"0","element":"span"},{"text":", which implies that:","element":"span"}],[{"style":{"width":"75%"},"width":1448,"height":363,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/26-8.png","element":"img"}],[{"text":"We know that","element":"span"}],[{"style":{"width":"74%"},"width":1430,"height":378,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/26-9.png","element":"img"}],[{"text":"where ","element":"span"},{"style":{"height":14},"width":45.5,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/26-10.png","element":"img","alt":" Q′","inline":true,"padRight":true},{"text":"consists of terms that contain a factor of some ","element":"span"},{"style":{"height":14.74},"width":45.99,"height":36.85,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/26-11.png","element":"img","alt":" Y ′r","inline":true},{"text":". For similar reasons, this implies that","element":"span"}],[{"style":{"width":"52%"},"width":1005,"height":144,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/26-12.png","element":"img"}],[{"text":"Let’s view ","element":"span"},{"style":{"height":22.53},"width":256.84,"height":56.32,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/26-13.png","element":"img","alt":"∏_{k=1}^{T} η′_{k,i_k} η′_{k,j_k}","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":20.4},"width":256.84,"height":51.01,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/26-14.png","element":"img","alt":" ∏_{k=1}^{T} η_{k,i_k} η_{k,j_k}","inline":true,"padRight":true},{"text":"as terms in a sum. 
In the second expression, every term has ","element":"span"},{"text":"expectation ","element":"span"},{"style":{"height":22.71},"width":113.26,"height":56.77,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/26-15.png","element":"img","alt":"(s/m)^{2T}","inline":true,"padRight":true},{"text":", and there are at most ","element":"span"},{"style":{"height":13.38},"width":75.25,"height":33.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/26-16.png","element":"img","alt":" N 2T","inline":true,"padRight":true},{"text":"terms. In the first expression, if there are ","element":"span"},{"style":{"fontStyle":"italic"},"text":"> s ","element":"span"},{"text":"copies of any ","element":"span"},{"style":{"height":12.79},"width":30.73,"height":31.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/26-17.png","element":"img","alt":" ik","inline":true,"padRight":true},{"text":"value, then the expectation is ","element":"span"},{"text":"0","element":"span"},{"text":". Otherwise, the expectation varies between ","element":"span"},{"style":{"height":22.71},"width":217.13,"height":56.77,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/26-18.png","element":"img","alt":" C_2^{−2T} (s/m)^{2T}","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":22.71},"width":113.25,"height":56.77,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/26-19.png","element":"img","alt":"(s/m)^{2T}","inline":true,"padRight":true},{"text":". By the counting argument at the beginning of the proof, we know that there are at least ","element":"span"},{"style":{"height":17.34},"width":147.57,"height":43.35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/26-20.png","element":"img","alt":" C2T1 N 2T","inline":true,"padRight":true},{"text":"terms. 
This implies ","element":"span"},{"text":"that","element":"span"}],[{"style":{"width":"51%"},"width":983,"height":42,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/26-21.png","element":"img"}],[{"text":"as desired.","element":"span"}],[{"style":{"width":"96%"},"width":1850,"height":41,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/26-22.png","element":"img"}],[{"text":"for ","element":"span"},{"style":{"height":13.2},"width":167.97,"height":33,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/26-23.png","element":"img","alt":" 1 ≤ x ≤ s","inline":true},{"text":":","element":"span"}],[{"style":{"width":"76%"},"width":1469,"height":228,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/26-24.png","element":"img"}],[{"text":"where ","element":"span"},{"style":{"height":13.19},"width":38.13,"height":32.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/27-0.png","element":"img","alt":" Yr","inline":true,"padRight":true},{"text":"has expectation ","element":"span"},{"style":{"height":13.2},"width":62.06,"height":33,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/27-1.png","element":"img","alt":" ≥ 0","inline":true},{"text":". In this case we have that","element":"span"}],[{"style":{"width":"56%"},"width":1082,"height":144,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/27-2.png","element":"img"}],[{"text":"where ","element":"span"},{"style":{"fontStyle":"italic"},"text":"Q ","element":"span"},{"text":"has expectation ","element":"span"},{"style":{"height":13.2},"width":62.06,"height":33,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/27-3.png","element":"img","alt":" ≥ 0","inline":true},{"text":". 
This implies that:","element":"span"}],[{"style":{"width":"87%"},"width":1674,"height":818,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/27-4.png","element":"img"}],[{"text":"where ","element":"span"},{"style":{"height":14},"width":45.5,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/27-5.png","element":"img","alt":" Q′","inline":true,"padRight":true},{"text":"consists of terms that contain a factor of some ","element":"span"},{"style":{"height":14.74},"width":45.99,"height":36.85,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/27-6.png","element":"img","alt":" Y ′r","inline":true},{"text":". For similar reasons to the above, we have that:","element":"span"}],[{"style":{"width":"65%"},"width":1257,"height":145,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/27-7.png","element":"img"}],[{"text":"Let’s view ","element":"span"},{"style":{"height":21.2},"width":347.19,"height":53.01,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/27-8.png","element":"img","alt":"∏_{k=1}^{T} (η_{k,i_k} η_{k,j_k})^{q/T}","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":33.1},"width":471.46,"height":82.74,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/27-9.png","element":"img","alt":" ∏_{k=1}^{T} (η′_{k,i_k} η′_{k,j_k} I_{M′_k=2})^{q/T}","inline":true,"padRight":true},{"text":"as terms in a sum. 
In the second expression, every term has expectation ","element":"span"},{"style":{"height":22.71},"width":158.11,"height":56.77,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/27-10.png","element":"img","alt":" ≤ (s/m)^{2T}","inline":true,"padRight":true},{"text":"(the indicator can only ","element":"span"},{"style":{"fontStyle":"italic"},"text":"reduce ","element":"span"},{"text":"the expectation), and there are at most ","element":"span"},{"style":{"height":13.38},"width":75.25,"height":33.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/27-11.png","element":"img","alt":"N 2T","inline":true,"padRight":true},{"text":"terms. In the first expression, if there are ","element":"span"},{"style":{"fontStyle":"italic"},"text":"> s ","element":"span"},{"text":"copies of any ","element":"span"},{"style":{"height":12.79},"width":30.73,"height":31.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/27-12.png","element":"img","alt":" ik","inline":true,"padRight":true},{"text":"value, then the expectation is ","element":"span"},{"text":"0","element":"span"},{"text":". Otherwise, the expectation varies between ","element":"span"},{"style":{"height":22.7},"width":217.12,"height":56.76,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/27-13.png","element":"img","alt":" C_2^{−2T} (s/m)^{2T}","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":22.7},"width":113.25,"height":56.76,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/27-14.png","element":"img","alt":"(s/m)^{2T}","inline":true,"padRight":true},{"text":". By the counting argument, we know that there are at least ","element":"span"},{"style":{"height":18.67},"width":172.47,"height":46.67,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/27-15.png","element":"img","alt":" C−2T1 N 2T","inline":true,"padRight":true},{"text":"terms. 
This implies that","element":"span"}],[{"style":{"width":"83%"},"width":1605,"height":69,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/27-16.png","element":"img"}],[{"text":"as desired.","element":"span"}]]},{"heading":"H Proof of Lemma 3.1 and Lemma 3.2","paragraphs":[[{"text":"Recall that our proof of Theorem ","element":"span"},{"href":"#id-25","text":"1.5 ","element":"a"},{"text":"requires cleaner bounds on moments of ","element":"span"},{"style":{"height":19.18},"width":290.09,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/27-17.png","element":"img","alt":" ∥R(x1, . . . , xn)∥q","inline":true,"padRight":true},{"text":"that follow simplifying the bounds in Lemma ","element":"span"},{"href":"#id-36","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"3 ","element":"span"},{"text":"and Lemma ","element":"span"},{"href":"#id-37","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"4 ","element":"span"},{"text":"at the target values of ","element":"span"},{"style":{"fontStyle":"italic"},"text":"v","element":"span"},{"text":". The proofs of these lemmas boil down to function bounding and simplification.","element":"span"}],[{"style":{"fontWeight":"bold"},"text":"H.1 ","element":"span"},{"style":{"fontWeight":"bold"},"text":"Proof of Lemma ","element":"span"},{"href":"#id-38","style":{"fontWeight":"bold"},"text":"3.1","element":"a"}],[{"text":"First, we show how Lemma ","element":"span"},{"href":"#id-36","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"3 ","element":"span"},{"text":"implies Lemma ","element":"span"},{"href":"#id-38","text":"3","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"1","element":"span"},{"text":". 
The proof involves simplifying and bounding the function at the target ","element":"span"},{"style":{"fontStyle":"italic"},"text":"v ","element":"span"},{"text":"value.","element":"span"}],[{"style":{"fontStyle":"italic"},"text":"Proof of Lemma ","element":"span"},{"href":"#id-38","text":"3","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"1","element":"span"},{"style":{"fontStyle":"italic"},"text":". ","element":"span"},{"text":"We plug ","element":"span"},{"style":{"fontStyle":"italic"},"text":"q ","element":"span"},{"text":"= ","element":"span"},{"style":{"fontStyle":"italic"},"text":"p ","element":"span"},{"text":"into Lemma ","element":"span"},{"href":"#id-36","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"3","element":"span"},{"text":". We use this relaxed version of the bound: If ","element":"span"},{"style":{"height":16.57},"width":142.29,"height":41.43,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-0.png","element":"img","alt":"semv2 ≥ q","inline":true},{"text":", ","element":"span"},{"text":"then ","element":"span"},{"style":{"height":25.21},"width":404.78,"height":63.03,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-1.png","element":"img","alt":" ∥R(x1, . . . , xn)∥q ≲ √q√m","inline":true},{"text":". 
Otherwise, if there exists ","element":"span"},{"style":{"height":16.59},"width":244.88,"height":41.47,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-2.png","element":"img","alt":" C2q3mv4 ≥ s2","inline":true},{"text":", then","element":"span"}],[{"style":{"width":"88%"},"width":1697,"height":192,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-3.png","element":"img"}],[{"text":"Suppose that the absolute constant on the upper bounds is ","element":"span"},{"style":{"height":13.2},"width":94.61,"height":33,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-4.png","element":"img","alt":" ≤ C′","inline":true},{"text":". Let ","element":"span"},{"style":{"height":16},"width":284.71,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-5.png","element":"img","alt":" C = max(C′, 1)","inline":true,"padRight":true},{"text":"(we take ","element":"span"},{"style":{"fontStyle":"italic"},"text":"C ","element":"span"},{"text":"to be the constant on the upper bounds). ","element":"span"},{"text":"Let’s take ","element":"span"},{"style":{"height":23.13},"width":208.82,"height":57.83,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-6.png","element":"img","alt":" Cv,2 = 0.25√C","inline":true,"padRight":true},{"text":", ","element":"span"},{"style":{"height":20.02},"width":782.61,"height":50.05,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-7.png","element":"img","alt":" Cv,1 = min( 0.1C3/2 , Cv,2), CS = 4C, CM =","inline":true}],[{"style":{"width":"99%"},"width":1908,"height":236,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-8.png","element":"img"}],[{"text":"First, let’s analyze ","element":"span"},{"style":{"height":14},"width":109.39,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-9.png","element":"img","alt":" v = f2","inline":true},{"text":". 
We show that ","element":"span"},{"style":{"height":17.38},"width":290.54,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-10.png","element":"img","alt":" ln(pmf 42 /s2) ≥ 2","inline":true},{"text":". Observe that ","element":"span"},{"style":{"height":21.08},"width":636.25,"height":52.71,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-11.png","element":"img","alt":" ln(pmf 42 /s2) = ln(C4v,2 ln2(mϵ2/p))+","inline":true}],[{"style":{"height":17.38},"width":173.72,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-12.png","element":"img","alt":"ln(mϵ2/p)","inline":true},{"text":". Using the fact that ","element":"span"},{"style":{"height":12.8},"width":107.12,"height":32,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-13.png","element":"img","alt":" m ≥ e","inline":true}],[{"style":{"width":"29%"},"width":559,"height":98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-14.png","element":"img"}],[{"text":"Now, since ","element":"span"},{"style":{"height":16.58},"width":205.52,"height":41.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-15.png","element":"img","alt":" m ≥ e2ϵ−2p","inline":true},{"text":", this implies that","element":"span"}],[{"style":{"width":"59%"},"width":1134,"height":53,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-16.png","element":"img"}],[{"text":"Moreover, we know that ","element":"span"},{"style":{"height":17.34},"width":210.42,"height":43.35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-17.png","element":"img","alt":" p3mf 22 ≥ s2","inline":true},{"text":", since ","element":"span"},{"style":{"height":16.58},"width":225.92,"height":41.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-18.png","element":"img","alt":" pmv4 ≥ e2s2","inline":true},{"text":". 
Now, we show that ","element":"span"},{"style":{"height":27.95},"width":390.75,"height":69.88,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-19.png","element":"img","alt":" C pf 22s ln(pmf 42 /s2) ≤ 0.25ϵ","inline":true},{"text":". Let’s ","element":"span"},{"text":"observe that","element":"span"}],[{"style":{"width":"69%"},"width":1326,"height":214,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-20.png","element":"img"}],[{"text":"Now, we handle the case where ","element":"span"},{"style":{"height":12.8},"width":140.65,"height":32,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-21.png","element":"img","alt":" m ≥ s·e","inline":true}],[{"text":"using that ","element":"span"},{"style":{"height":12.8},"width":126.06,"height":32,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-22.png","element":"img","alt":" m ≥ se","inline":true},{"text":", this immediately follows from ","element":"span"},{"style":{"height":20.21},"width":360.04,"height":50.52,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-23.png","element":"img","alt":"ps ln(m/s) ≤ ps ≤ 0.25ϵ","inline":true},{"text":". Otherwise, we need it to be true that ","element":"span"},{"style":{"height":17.38},"width":359.08,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-24.png","element":"img","alt":"s ln(m/s) ≥ 4Cpϵ−1","inline":true},{"text":". This can be written as ","element":"span"},{"style":{"height":23.02},"width":316.14,"height":57.54,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-25.png","element":"img","alt":" ln(m/s) ≥ 4Cpϵ−1s","inline":true,"padRight":true},{"text":". 
Since ","element":"span"},{"style":{"height":13.19},"width":170.05,"height":32.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-26.png","element":"img","alt":" CS = 4C","inline":true},{"text":", this can be written as:","element":"span"}],[{"style":{"fontStyle":"italic"},"text":"m ","element":"span"},{"style":{"height":12.8},"width":78.14,"height":32,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-27.png","element":"img","alt":" ≥ s ·","inline":true,"padRight":true},{"style":{"fontStyle":"italic"},"text":"e","element":"span"}],[{"style":{"height":14},"width":109.39,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-28.png","element":"img","alt":"v = f2","inline":true},{"text":":","element":"span"}],[{"style":{"width":"96%"},"width":1851,"height":377,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-29.png","element":"img"}],[{"text":"only exist if ","element":"span"},{"style":{"height":17.38},"width":328,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-30.png","element":"img","alt":" s ≤ Θ(ϵ−1 ln(1/δ))","inline":true},{"text":". 
Observe that we can set ","element":"span"},{"style":{"height":24.89},"width":170.18,"height":62.22,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-31.png","element":"img","alt":" C2 = 1C4v,1","inline":true,"padRight":true},{"text":"and using the fact that ","element":"span"},{"style":{"height":15.59},"width":201.6,"height":38.97,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-32.png","element":"img","alt":" Cv,1 ≤ Cv,2","inline":true},{"text":", we ","element":"span"},{"text":"obtain that","element":"span"}],[{"style":{"width":"64%"},"width":1229,"height":91,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-33.png","element":"img"}],[{"text":"Thus, this is lower bounded by ","element":"span"},{"text":"1 ","element":"span"},{"text":"when ","element":"span"},{"style":{"height":24.89},"width":165.37,"height":62.22,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/28-34.png","element":"img","alt":" C2 = 1C4v,1","inline":true,"padRight":true},{"text":".","element":"span"}],[{"text":"First, we analyze the case of ","element":"span"},{"style":{"height":14},"width":109.4,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-0.png","element":"img","alt":" v = f1","inline":true},{"text":". We show that ","element":"span"},{"style":{"height":28.95},"width":324.97,"height":72.38,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-1.png","element":"img","alt":"CC1/32 p2v2s ln2(pmv2/s) ≤ 0.1ϵ","inline":true},{"text":". 
Observe that","element":"span"}],[{"style":{"width":"99%"},"width":1908,"height":406,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-2.png","element":"img"}],[{"text":"where the last inequality uses the fact that ","element":"span"},{"style":{"height":20.02},"width":197.72,"height":50.04,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-3.png","element":"img","alt":" Cv,1 ≤ 0.1C3/2","inline":true,"padRight":true},{"text":".","element":"span"}],[{"style":{"width":"96%"},"width":1852,"height":41,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-4.png","element":"img"}],[{"text":"bound if ","element":"span"},{"style":{"height":17.38},"width":289.91,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-5.png","element":"img","alt":" ln(pmv4/s2) ≥ 2","inline":true},{"text":". First, we show this is an increasing function of ","element":"span"},{"style":{"fontStyle":"italic"},"text":"v","element":"span"},{"text":". Let ","element":"span"},{"style":{"height":17.38},"width":233.43,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-6.png","element":"img","alt":" w = pmv4/s2","inline":true},{"text":". We see that","element":"span"}],[{"style":{"height":11.6},"width":49.18,"height":29,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-7.png","element":"img","alt":"√w","inline":true},{"style":{"height":7.6},"width":55.07,"height":19,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-8.png","element":"img","alt":"ln w","inline":true},{"text":". 
We observe that this is an increasing function of ","element":"span"},{"style":{"fontStyle":"italic"},"text":"w ","element":"span"},{"text":"as long as ","element":"span"},{"style":{"height":15.78},"width":117.29,"height":39.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-9.png","element":"img","alt":" w ≥ e2","inline":true},{"text":", which is exactly","element":"span"}],[{"style":{"width":"99%"},"width":1910,"height":131,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-10.png","element":"img"}],[{"text":"if ","element":"span"},{"style":{"height":17.38},"width":273.31,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-11.png","element":"img","alt":" ln(pmv2/s) ≥ 1","inline":true},{"text":". First, we show that ","element":"span"},{"style":{"height":16},"width":239.53,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-12.png","element":"img","alt":" f(v) ≤ 2f(v′)","inline":true,"padRight":true},{"text":"if ","element":"span"},{"style":{"height":12.8},"width":112.33,"height":32,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-13.png","element":"img","alt":" v ≤ v′","inline":true},{"text":". Let ","element":"span"},{"style":{"height":17.38},"width":219.02,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-14.png","element":"img","alt":" w = pmv2/s","inline":true},{"text":". 
We see that ","element":"span"},{"style":{"height":25.82},"width":229.28,"height":64.54,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-15.png","element":"img","alt":"p2v2s ln(pmv2/s) =","inline":true}],[{"style":{"width":"99%"},"width":1906,"height":37,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-16.png","element":"img"}],[{"text":"this is bounded by at most a factor of ","element":"span"},{"text":"2 ","element":"span"},{"text":"above any other ","element":"span"},{"style":{"fontStyle":"italic"},"text":"w ","element":"span"},{"text":"value.","element":"span"}],[{"style":{"width":"96%"},"width":1852,"height":111,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-17.png","element":"img"}],[{"text":"that ","element":"span"},{"style":{"height":19.18},"width":436.67,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-18.png","element":"img","alt":" ∥R(x1, . . . , xn)∥q ≤ 0.25ϵ","inline":true},{"text":".","element":"span"}],[{"style":{"width":"73%"},"width":1405,"height":223,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-19.png","element":"img"}],[{"text":"Otherwise, we know that ","element":"span"},{"style":{"height":17.39},"width":293.49,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-20.png","element":"img","alt":" ln(pmv4/s2) > 2","inline":true},{"text":". First let’s show that that ","element":"span"},{"style":{"height":25.82},"width":387.02,"height":64.54,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-21.png","element":"img","alt":" C pv2s ln(pmv4/s2) ≤ 0.25ϵ","inline":true},{"text":". We know that ","element":"span"},{"style":{"height":14},"width":117.49,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-22.png","element":"img","alt":"v ≤ f2","inline":true},{"text":". 
At ","element":"span"},{"style":{"height":14},"width":117.49,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-23.png","element":"img","alt":" v = f2","inline":true},{"text":", we know that the expression is upper bounded by ","element":"span"},{"style":{"height":11.2},"width":90.84,"height":28,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-24.png","element":"img","alt":" 0.25ϵ","inline":true},{"text":". Since the ","element":"span"},{"style":{"height":25.82},"width":195.68,"height":64.54,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-25.png","element":"img","alt":"pv2s ln(pmv4/s2)","inline":true,"padRight":true},{"text":"term is ","element":"span"},{"text":"an increasing function of ","element":"span"},{"style":{"fontStyle":"italic"},"text":"v ","element":"span"},{"text":"in this regime, this means that we get a bound of ","element":"span"},{"style":{"height":11.2},"width":90.85,"height":28,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-26.png","element":"img","alt":" 0.25ϵ","inline":true,"padRight":true},{"text":"in this case too. Thus, we know that:","element":"span"}],[{"style":{"width":"75%"},"width":1450,"height":310,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-27.png","element":"img"}],[{"text":"Now, suppose that ","element":"span"},{"style":{"height":14},"width":119.02,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-28.png","element":"img","alt":" v = f2","inline":true},{"text":". We’ve already shown that ","element":"span"},{"style":{"height":17.39},"width":297.11,"height":43.47,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-29.png","element":"img","alt":" ln(pmv4/s2) ≥ 2","inline":true,"padRight":true},{"text":"here (near the beginning of the proof). 
Since ","element":"span"},{"style":{"height":14},"width":109.39,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-30.png","element":"img","alt":" v ≤ f1","inline":true},{"text":", we obtain a bound of ","element":"span"},{"style":{"height":10.8},"width":239.86,"height":27,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-31.png","element":"img","alt":" 2 · 0.1ϵ = 0.2ϵ","inline":true},{"text":". This means:","element":"span"}],[{"style":{"width":"87%"},"width":1682,"height":383,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/29-32.png","element":"img"}],[{"style":{"fontWeight":"bold"},"text":"H.2 ","element":"span"},{"style":{"fontWeight":"bold"},"text":"Proof of Lemma ","element":"span"},{"href":"#id-39","style":{"fontWeight":"bold"},"text":"3.2","element":"a"}],[{"text":"Now, we show how Lemma ","element":"span"},{"href":"#id-36","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"3 ","element":"span"},{"text":"and Lemma ","element":"span"},{"href":"#id-37","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"4 ","element":"span"},{"text":"imply Lemma ","element":"span"},{"href":"#id-39","text":"3","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"2","element":"span"},{"text":". The proof simply involves bounding and simplifying the functions in the original lemmas at the target ","element":"span"},{"style":{"fontStyle":"italic"},"text":"v ","element":"span"},{"text":"value.","element":"span"}],[{"style":{"fontStyle":"italic"},"text":"Proof of Lemma ","element":"span"},{"href":"#id-39","text":"3","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"2","element":"span"},{"style":{"fontStyle":"italic"},"text":". 
","element":"span"},{"text":"We use Lemma ","element":"span"},{"href":"#id-36","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"3 ","element":"span"},{"text":"but put in an absolute constant. Let ","element":"span"},{"style":{"height":13.19},"width":124,"height":32.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-0.png","element":"img","alt":" D2 > 0","inline":true,"padRight":true},{"text":"be such that: if ","element":"span"},{"style":{"height":16.57},"width":137.69,"height":41.43,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-1.png","element":"img","alt":"semv2 ≥ q","inline":true},{"text":", ","element":"span"},{"text":"then","element":"span"}],[{"style":{"width":"24%"},"width":478,"height":81,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-2.png","element":"img"}],[{"text":"Otherwise, if ","element":"span"},{"style":{"height":16.59},"width":198.52,"height":41.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-3.png","element":"img","alt":" q3mv4 ≥ s2","inline":true},{"text":", then ","element":"span"},{"style":{"height":19.18},"width":290.08,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-4.png","element":"img","alt":" ∥R(x1, . . . 
, xn)∥q","inline":true,"padRight":true},{"text":"is upper bounded by:","element":"span"}],[{"style":{"width":"82%"},"width":1568,"height":249,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-5.png","element":"img"}],[{"text":"We use Lemma ","element":"span"},{"href":"#id-37","text":"2","element":"a"},{"style":{"fontStyle":"italic"},"text":".","element":"span"},{"text":"4 ","element":"span"},{"text":"but put in an absolute constant ","element":"span"},{"style":{"height":13.19},"width":125.62,"height":32.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-6.png","element":"img","alt":" D1 > 0","inline":true,"padRight":true},{"text":"(which we take to be ","element":"span"},{"style":{"height":13.2},"width":62.88,"height":33,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-7.png","element":"img","alt":" ≤ 1","inline":true},{"text":"). Let ","element":"span"},{"style":{"height":14},"width":183.65,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-8.png","element":"img","alt":" 2 ≤ q ≤ m","inline":true,"padRight":true},{"text":"be an even integer, and suppose that ","element":"span"},{"style":{"height":13.6},"width":197.93,"height":34,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-9.png","element":"img","alt":" 0 < v ≤ 0.5","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":19.37},"width":30.94,"height":48.43,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-10.png","element":"img","alt":"1v2","inline":true,"padRight":true},{"text":"is an even integer. 
If ","element":"span"},{"style":{"height":16.59},"width":129.98,"height":41.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-11.png","element":"img","alt":" qv2 ≤ s","inline":true},{"text":", then","element":"span"}],[{"style":{"width":"24%"},"width":478,"height":93,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-12.png","element":"img"}],[{"text":"If ","element":"span"},{"style":{"fontStyle":"italic"},"text":"m ","element":"span"},{"style":{"height":12.8},"width":31,"height":32,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-13.png","element":"img","alt":" ≥","inline":true,"padRight":true},{"style":{"fontStyle":"italic"},"text":"q","element":"span"},{"text":", ","element":"span"},{"style":{"height":16},"width":122.29,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-14.png","element":"img","alt":" 2 ≤ ln(","inline":true},{"style":{"fontStyle":"italic"},"text":"qmv","element":"span"},{"style":{"height":17.38},"width":131.92,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-15.png","element":"img","alt":"4/s2) ≤","inline":true,"padRight":true},{"style":{"fontStyle":"italic"},"text":"q","element":"span"},{"text":", ","element":"span"},{"style":{"height":17.38},"width":256.38,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-16.png","element":"img","alt":" 2qv2 ≤ 0.5s ln(","inline":true},{"style":{"fontStyle":"italic"},"text":"qmv","element":"span"},{"style":{"height":17.38},"width":90.36,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-17.png","element":"img","alt":"4/s2)","inline":true},{"text":", and ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"style":{"height":12.8},"width":31,"height":32,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-18.png","element":"img","alt":" 
≤","inline":true,"padRight":true},{"style":{"fontStyle":"italic"},"text":"m/e ","element":"span"},{"text":"then:","element":"span"}],[{"style":{"width":"99%"},"width":1910,"height":586,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-19.png","element":"img"}],[{"text":"First, we handle the case where ","element":"span"},{"style":{"height":17.38},"width":349.41,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-20.png","element":"img","alt":" m ≤ Θ(ϵ−2 ln(1/δ))","inline":true},{"text":". Let’s take ","element":"span"},{"style":{"height":14},"width":109.79,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-21.png","element":"img","alt":" v = ψ","inline":true,"padRight":true},{"text":"for any sufficiently small ","element":"span"},{"style":{"height":14},"width":26,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-22.png","element":"img","alt":" ψ","inline":true},{"text":". By sufficiently small, we mean ","element":"span"},{"style":{"height":21.28},"width":155.71,"height":53.2,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-23.png","element":"img","alt":" v2 ≤ se2mq","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":13.6},"width":197.93,"height":34,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-24.png","element":"img","alt":" 0 < v ≤ 0.5","inline":true},{"text":". This implies that ","element":"span"},{"style":{"height":16.57},"width":157.61,"height":41.44,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-25.png","element":"img","alt":"semv2 ≥ 2q","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":16.58},"width":129.98,"height":41.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-26.png","element":"img","alt":" qv2 ≤ s","inline":true},{"text":". 
Thus we know","element":"span"}],[{"text":"(using that ","element":"span"},{"style":{"fontStyle":"italic"},"text":"q ","element":"span"},{"style":{"height":12.8},"width":31,"height":32,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-27.png","element":"img","alt":" ≤","inline":true,"padRight":true},{"style":{"fontStyle":"italic"},"text":"m","element":"span"},{"text":") that ","element":"span"},{"style":{"height":16},"width":104.77,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-28.png","element":"img","alt":" ∥R(x1","inline":true},{"style":{"fontStyle":"italic"},"text":", . . . , x","element":"span"},{"style":{"height":19.18},"width":192.72,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-29.png","element":"img","alt":"n)∥2q ≤ D2","inline":true}],[{"style":{"width":"28%"},"width":541,"height":108,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-30.png","element":"img"}],[{"text":"as desired. Suppose that ","element":"span"},{"style":{"height":17.38},"width":339.49,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-31.png","element":"img","alt":" m ≤ Θ(ϵ−2 ln(1/δ))","inline":true},{"text":". Based on the setting ","element":"span"},{"style":{"fontStyle":"italic"},"text":"q","element":"span"},{"text":", this means that ","element":"span"},{"style":{"height":19.18},"width":426.18,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-32.png","element":"img","alt":" ∥R(v, . . . , v, 0 . . . 
, 0)∥q ≥","inline":true}],[{"style":{"width":"99%"},"width":1910,"height":99,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-33.png","element":"img"}],[{"text":"us to assume that ","element":"span"},{"style":{"height":17.38},"width":323.19,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-34.png","element":"img","alt":" s ≤ Θ(ϵ−1 ln(1/δ))","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":15.78},"width":182.64,"height":39.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-35.png","element":"img","alt":" m ≤ ϵ−2ep","inline":true},{"text":". Let ","element":"span"},{"style":{"height":26.63},"width":280.62,"height":66.58,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-36.png","element":"img","alt":" f1 = 4√ϵsln( mϵq )q","inline":true,"padRight":true},{"text":"and let ","element":"span"},{"style":{"height":16},"width":158.91,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-37.png","element":"img","alt":" f2 = √ϵs","inline":true}],[{"text":"consider ","element":"span"},{"style":{"height":15.59},"width":283.56,"height":38.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-38.png","element":"img","alt":" v = Cv,1f1 =: v1","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":15.59},"width":283.55,"height":38.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-39.png","element":"img","alt":" v = Cv,2f2 =: v2","inline":true},{"text":". First, we handle the condition of ","element":"span"},{"style":{"height":16.58},"width":198.52,"height":41.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-40.png","element":"img","alt":" q3mv4 ≥ s2","inline":true},{"text":". 
We enforce the condition ","element":"span"},{"style":{"height":15.59},"width":240.91,"height":38.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-41.png","element":"img","alt":" Cv,1, Cv,2 ≥ 1","inline":true},{"text":". Assuming that ","element":"span"},{"style":{"height":24.25},"width":137.66,"height":60.64,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-42.png","element":"img","alt":" v ≥√ϵsq","inline":true,"padRight":true},{"text":"(which is true at the two values of ","element":"span"},{"style":{"fontStyle":"italic"},"text":"v ","element":"span"},{"text":"that we consider), we","element":"span"}],[{"text":"know ","element":"span"},{"style":{"height":25.42},"width":289.66,"height":63.55,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-43.png","element":"img","alt":"q3mv4s2 ≥ mϵ2q ≥ 1","inline":true},{"text":". Also, we make ","element":"span"},{"style":{"height":16.58},"width":235.22,"height":41.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-44.png","element":"img","alt":" m ≥ 2C2ϵ−2q","inline":true},{"text":", so that","element":"span"},{"style":{"height":28.8},"width":40,"height":72,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-45.png","element":"img","alt":"�","inline":true}],[{"text":"Consider ","element":"span"},{"style":{"height":9.19},"width":124.55,"height":22.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-46.png","element":"img","alt":" v = v2","inline":true},{"text":". We first check that the conditions for the upper bound are satisfied. 
We have that","element":"span"}],[{"style":{"width":"99%"},"width":1907,"height":54,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/30-47.png","element":"img"}],[{"style":{"height":17.38},"width":296.83,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-0.png","element":"img","alt":"ln(qmv4/s2) ≥ 2","inline":true},{"text":". Also, we have that ","element":"span"},{"style":{"height":28.8},"width":271.88,"height":72,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-1.png","element":"img","alt":"qmv2se = √qm�","inline":true}],[{"text":"needed for the lower bound. Observe that","element":"span"}],[{"style":{"width":"59%"},"width":1138,"height":95,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-2.png","element":"img"}],[{"text":"as desired. We check that ","element":"span"},{"style":{"height":17.39},"width":285.65,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-3.png","element":"img","alt":" ln(qmv4/s2) ≤ q","inline":true},{"text":". It suffices to show that","element":"span"}],[{"style":{"width":"21%"},"width":420,"height":104,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-4.png","element":"img"}],[{"text":"Using the condition that ","element":"span"},{"style":{"height":25.7},"width":228.57,"height":64.24,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-5.png","element":"img","alt":" m ≤ ϵ−2 eqqC4v,2","inline":true,"padRight":true},{"text":"where we obtain that","element":"span"}],[{"style":{"width":"54%"},"width":1050,"height":104,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-6.png","element":"img"}],[{"text":"as desired. 
Now, we compute the value of ","element":"span"},{"style":{"height":25.82},"width":194.86,"height":64.54,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-7.png","element":"img","alt":"qv2s ln(qmv4/s2)","inline":true,"padRight":true},{"text":"at ","element":"span"},{"style":{"height":15.59},"width":182.16,"height":38.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-8.png","element":"img","alt":" v = Cv,2f2","inline":true},{"text":". We obtain:","element":"span"}],[{"style":{"width":"96%"},"width":1850,"height":201,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-9.png","element":"img"}],[{"text":"that ","element":"span"},{"style":{"height":25.42},"width":439.45,"height":63.54,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-10.png","element":"img","alt":"qmv2s = 16C2v,1mϵq ln2( mϵq )","inline":true},{"text":". Observe that when ","element":"span"},{"style":{"height":15.59},"width":146.96,"height":38.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-11.png","element":"img","alt":" Cv,1 ≥ 1","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":16.58},"width":372.38,"height":41.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-12.png","element":"img","alt":" m ≥ e2ϵ−2q ≥ e2ϵ−1q","inline":true},{"text":", this is lower bounded ","element":"span"},{"text":"by ","element":"span"},{"style":{"height":13.38},"width":34.56,"height":33.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-13.png","element":"img","alt":" e2","inline":true},{"text":", so ","element":"span"},{"style":{"height":17.38},"width":274.26,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-14.png","element":"img","alt":" ln(qmv2/s) ≥ 2","inline":true},{"text":". 
Now, we claim that when ","element":"span"},{"style":{"height":14},"width":131.52,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-15.png","element":"img","alt":" f1 ≤ f2","inline":true},{"text":", we show that ","element":"span"},{"style":{"height":17.38},"width":313.4,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-16.png","element":"img","alt":" ln(qmv2/s) ≤ q/2","inline":true},{"text":". In this case, using that ","element":"span"},{"style":{"height":16.58},"width":199.86,"height":41.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-17.png","element":"img","alt":" m ≤ ϵ−2qeq","inline":true},{"text":", we have: ","element":"span"},{"style":{"height":24.03},"width":193.21,"height":60.07,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-18.png","element":"img","alt":"4 ln(mϵ/q)q ≤","inline":true}],[{"text":"Observe that","element":"span"}],[{"style":{"width":"46%"},"width":894,"height":226,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-19.png","element":"img"}],[{"text":"At this value, observe that:","element":"span"}],[{"style":{"width":"57%"},"width":1095,"height":158,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-20.png","element":"img"}],[{"text":"Let ","element":"span"},{"style":{"height":13.19},"width":139.26,"height":32.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-21.png","element":"img","alt":" C = D1","inline":true},{"text":". Let’s set","element":"span"},{"style":{"height":28.8},"width":40,"height":72,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-22.png","element":"img","alt":"�","inline":true}],[{"style":{"height":7.6},"width":24,"height":19,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-23.png","element":"img","alt":"C","inline":true,"padRight":true},{"text":". 
Using the fact that ","element":"span"},{"style":{"height":15.79},"width":148.55,"height":39.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-24.png","element":"img","alt":" v2 ≤ 0.5","inline":true,"padRight":true},{"text":"(so ","element":"span"},{"style":{"height":19.37},"width":116.2,"height":48.43,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-25.png","element":"img","alt":"1v2 ≥ 2","inline":true},{"text":"), this ","element":"span"},{"text":"means that ","element":"span"},{"style":{"height":19.37},"width":30.94,"height":48.43,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-26.png","element":"img","alt":"1v2","inline":true,"padRight":true},{"text":"has can take on at least ","element":"span"},{"text":"3 ","element":"span"},{"text":"different powers of ","element":"span"},{"text":"2","element":"span"},{"text":". Let’s observe that when ","element":"span"},{"style":{"height":22.62},"width":334.95,"height":56.56,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-27.png","element":"img","alt":" 16C2v ln2( mϵq ) ≤ mϵq","inline":true,"padRight":true},{"text":"(we can get this condition by saying that ","element":"span"},{"style":{"height":18.17},"width":253.57,"height":45.44,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-28.png","element":"img","alt":" m ≥ CM,2ϵ−2q","inline":true,"padRight":true},{"text":"for a sufficiently large ","element":"span"},{"style":{"height":15.59},"width":85.61,"height":38.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-29.png","element":"img","alt":" CM,2","inline":true},{"text":") and ","element":"span"},{"style":{"height":18.73},"width":341.23,"height":46.82,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-30.png","element":"img","alt":" 16C2v ln2(mϵ/q) ≥ 1","inline":true,"padRight":true},{"text":"(we can get this condition by saying that 
","element":"span"},{"style":{"height":18.17},"width":253.57,"height":45.44,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-31.png","element":"img","alt":" m ≥ CM,2ϵ−2q","inline":true,"padRight":true},{"text":"for a sufficiently large ","element":"span"},{"style":{"height":15.59},"width":85.61,"height":38.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-32.png","element":"img","alt":" CM,2","inline":true},{"text":"), we know that","element":"span"}],[{"style":{"width":"41%"},"width":787,"height":102,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-33.png","element":"img"}],[{"text":"Suppose that ","element":"span"},{"style":{"height":24.58},"width":361.75,"height":61.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-34.png","element":"img","alt":" C4v ln2(mϵ2/q) ≤ mϵ2q","inline":true,"padRight":true},{"text":"(we can get this condition by saying that ","element":"span"},{"style":{"height":18.18},"width":255.73,"height":45.44,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-35.png","element":"img","alt":" m ≥ CM,2ϵ−2q","inline":true,"padRight":true},{"text":"for a sufficiently large ","element":"span"},{"style":{"height":15.59},"width":85.61,"height":38.97,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-36.png","element":"img","alt":" CM,2","inline":true},{"text":") and ","element":"span"},{"style":{"height":18.73},"width":321.02,"height":46.82,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-37.png","element":"img","alt":" C4v ln2(mϵ2/q) ≥ 1","inline":true,"padRight":true},{"text":"(we can get this condition by saying that ","element":"span"},{"style":{"height":18.17},"width":255.34,"height":45.44,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-38.png","element":"img","alt":" m ≥ CM,2ϵ−2q","inline":true,"padRight":true},{"text":"for a sufficiently 
","element":"span"},{"text":"large ","element":"span"},{"style":{"height":15.59},"width":85.61,"height":38.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-39.png","element":"img","alt":" CM,2","inline":true},{"text":"). Let’s observe that","element":"span"}],[{"style":{"width":"43%"},"width":828,"height":102,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/31-40.png","element":"img"}],[{"text":"Let ","element":"span"},{"style":{"height":19.75},"width":268.73,"height":49.38,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/32-0.png","element":"img","alt":" m′ = s · eCϵ−1q1024s","inline":true,"padRight":true},{"text":". When ","element":"span"},{"style":{"height":12.8},"width":147.87,"height":32,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/32-1.png","element":"img","alt":" m ≥ m′","inline":true},{"text":", we know that ","element":"span"},{"style":{"height":22.17},"width":282.66,"height":55.44,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/32-2.png","element":"img","alt":"qs ln(m/s) ≤ 1024ϵC","inline":true,"padRight":true},{"text":"and when ","element":"span"},{"style":{"height":12.8},"width":147.87,"height":32,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/32-3.png","element":"img","alt":" m ≤ m′","inline":true},{"text":", we know that ","element":"span"},{"style":{"height":22.17},"width":271.9,"height":55.43,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/32-4.png","element":"img","alt":"qs ln(m/s) ≥ 1024ϵC","inline":true,"padRight":true},{"text":".","element":"span"}],[{"text":"In order to plug in ","element":"span"},{"style":{"height":9.19},"width":113.3,"height":22.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/32-5.png","element":"img","alt":" v = v1","inline":true,"padRight":true},{"text":"and use the 
","element":"span"},{"style":{"height":26.24},"width":194.86,"height":65.59,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/32-6.png","element":"img","alt":"q2v2s ln2(qmv2/s)","inline":true,"padRight":true},{"text":"lower bound, we need to show that ","element":"span"},{"style":{"height":30.38},"width":226.69,"height":75.95,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/32-7.png","element":"img","alt":" v ≤√ln(m/s)√q","inline":true,"padRight":true},{"text":". At","element":"span"}],[{"style":{"width":"99%"},"width":1910,"height":64,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/32-8.png","element":"img"}],[{"style":{"height":17.39},"width":268.78,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/32-9.png","element":"img","alt":"ln(qmv2/s) ≥ 2","inline":true},{"text":". At this value, observe that:","element":"span"}],[{"style":{"width":"99%"},"width":1911,"height":199,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/32-10.png","element":"img"}],[{"text":"as long as ","element":"span"},{"style":{"height":15.78},"width":117.29,"height":39.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/32-11.png","element":"img","alt":" w ≥ e2","inline":true},{"text":". Thus, it suffices to show that ","element":"span"},{"style":{"height":27.95},"width":452.87,"height":69.88,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/32-12.png","element":"img","alt":"q2v21s ln2(qmv21/s) ≤ q2v2s ln2(qmv2/s)","inline":true},{"text":". 
When ","element":"span"},{"style":{"height":12.8},"width":137.11,"height":32,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/32-13.png","element":"img","alt":" m ≤ m′","inline":true},{"text":", we know that","element":"span"}],[{"style":{"width":"73%"},"width":1413,"height":388,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/32-14.png","element":"img"}],[{"text":"For the upper bound, we see that ","element":"span"},{"style":{"height":17.38},"width":573.23,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/32-15.png","element":"img","alt":" ln(2qmv4/s2) > ln(qmv4/s2) ≥ 2","inline":true,"padRight":true},{"text":"and","element":"span"},{"style":{"height":28.8},"width":40,"height":72,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/32-16.png","element":"img","alt":"�","inline":true}],[{"style":{"width":"85%"},"width":1634,"height":145,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/32-17.png","element":"img"}],[{"text":"Now, we use the fact that ","element":"span"},{"style":{"height":14},"width":258.2,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/32-18.png","element":"img","alt":" v ≤ Cvf1 := v1","inline":true,"padRight":true},{"text":"to see that:","element":"span"}],[{"style":{"width":"51%"},"width":980,"height":98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/32-19.png","element":"img"}],[{"text":"We also observe that since ","element":"span"},{"style":{"height":17.39},"width":382.93,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/32-20.png","element":"img","alt":" 2qmv4/s ≤ (qmv4/s)2","inline":true},{"text":", we know:","element":"span"}],[{"style":{"width":"37%"},"width":717,"height":98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/32-21.png","element":"img"}],[{"text":"This, coupled with the guarantee 
on","element":"span"},{"style":{"height":25.21},"width":57.06,"height":63.03,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/32-22.png","element":"img","alt":"√2q√m","inline":true,"padRight":true},{"text":", implies we have an upper bound of:","element":"span"}],[{"style":{"width":"70%"},"width":1340,"height":279,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/32-23.png","element":"img"}],[{"text":"Moreover, we have that","element":"span"}],[{"style":{"width":"58%"},"width":1112,"height":98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/32-24.png","element":"img"}],[{"text":"The next case is ","element":"span"},{"style":{"height":14},"width":126.03,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/32-25.png","element":"img","alt":" f1 ≤ f2","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"height":12.8},"width":137.11,"height":32,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/32-26.png","element":"img","alt":" m ≤ m′","inline":true},{"text":". We set ","element":"span"},{"style":{"height":9.19},"width":109.2,"height":22.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/32-27.png","element":"img","alt":" v = v1","inline":true},{"text":". Since ","element":"span"},{"style":{"height":14},"width":126.03,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/32-28.png","element":"img","alt":" f1 ≤ f2","inline":true},{"text":", we know that ","element":"span"},{"style":{"height":17.38},"width":285.65,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/32-29.png","element":"img","alt":" ln(qmv4/s2) ≤ q","inline":true},{"text":". 
Thus we know:","element":"span"}],[{"style":{"width":"85%"},"width":1626,"height":144,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/32-30.png","element":"img"}],[{"text":"For the upper bound, we know that:","element":"span"}],[{"style":{"width":"84%"},"width":1614,"height":144,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/33-0.png","element":"img"}],[{"text":"To make these bounds compatible, we need to handle the case where ","element":"span"},{"style":{"height":17.38},"width":445.76,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/33-1.png","element":"img","alt":" ln(qmv4/s) ≥ 2, qv2 ≥ s","inline":true,"padRight":true},{"text":"better. Let ","element":"span"},{"style":{"height":14},"width":167.99,"height":35,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/33-2.png","element":"img","alt":"v′ = Cvf2","inline":true},{"text":". Assuming that ","element":"span"},{"style":{"height":17.38},"width":268.78,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/33-3.png","element":"img","alt":" ln(qmv4/s) ≥ 2","inline":true},{"text":", we know that ","element":"span"},{"style":{"height":25.82},"width":195.19,"height":64.54,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/33-4.png","element":"img","alt":"8192qv2s ln(2qmv4/s)","inline":true,"padRight":true},{"text":"can be upper bounded by:","element":"span"}],[{"style":{"width":"76%"},"width":1466,"height":103,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/33-5.png","element":"img"}],[{"text":"as long as ","element":"span"},{"style":{"height":18.73},"width":294.74,"height":46.82,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/33-6.png","element":"img","alt":" ln2(mϵ/q)C4v ≥ 1","inline":true,"padRight":true},{"text":"(which we can make true by appropriately setting the constants on the bound for 
","element":"span"},{"style":{"fontStyle":"italic"},"text":"m","element":"span"},{"text":"). Observe also that:","element":"span"}],[{"style":{"width":"67%"},"width":1292,"height":257,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/33-7.png","element":"img"}],[{"text":"This, coupled with the guarantee on","element":"span"},{"style":{"height":25.21},"width":57.06,"height":63.03,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/33-8.png","element":"img","alt":"√2q√m","inline":true,"padRight":true},{"text":", implies that our upper bound becomes:","element":"span"}],[{"style":{"width":"78%"},"width":1505,"height":45,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/33-9.png","element":"img"}],[{"style":{"height":16},"width":66.5,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/33-10.png","element":"img","alt":"∥R(","inline":true},{"style":{"fontStyle":"italic"},"text":"v, . . . , v, ","element":"span"},{"text":"0","element":"span"},{"style":{"fontStyle":"italic"},"text":", . . . 
, ","element":"span"},{"style":{"height":19.18},"width":130.9,"height":47.96,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/33-11.png","element":"img","alt":" 0)∥2q ≤","inline":true}],[{"style":{"width":"33%"},"width":641,"height":21,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/33-12.png","element":"img"}],[{"text":"We now show that we can tweak ","element":"span"},{"style":{"height":13.19},"width":44.48,"height":32.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/33-13.png","element":"img","alt":" Cv","inline":true,"padRight":true},{"text":"within the factor of ","element":"span"},{"style":{"height":14.18},"width":68.14,"height":35.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/33-14.png","element":"img","alt":" 21/4","inline":true,"padRight":true},{"text":"range permitted to show that we can ensure that it is not true that ","element":"span"},{"style":{"height":17.39},"width":456.73,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/33-15.png","element":"img","alt":" 2 − ln 2 < ln(qmv4/s) ≤ 2","inline":true},{"text":". 
Observe that multiplying by a factor of ","element":"span"},{"style":{"height":14.19},"width":68.14,"height":35.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/33-16.png","element":"img","alt":" 21/4","inline":true,"padRight":true},{"text":"in this case yields ","element":"span"},{"style":{"height":17.39},"width":293.98,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/33-17.png","element":"img","alt":"ln(2qmv4/s) > 2","inline":true,"padRight":true},{"text":"and dividing by a factor of ","element":"span"},{"style":{"height":14.19},"width":68.13,"height":35.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/33-18.png","element":"img","alt":" 21/4","inline":true,"padRight":true},{"text":"yields ","element":"span"},{"style":{"height":17.39},"width":384.69,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/33-19.png","element":"img","alt":" ln(qmv4/s) ≤ 2 − ln 2","inline":true},{"text":". Thus, at least one of the ","element":"span"},{"style":{"height":13.19},"width":44.48,"height":32.98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/33-20.png","element":"img","alt":" Cv","inline":true,"padRight":true},{"text":"values that yields a power of ","element":"span"},{"text":"2 ","element":"span"},{"text":"for ","element":"span"},{"style":{"height":19.37},"width":30.94,"height":48.44,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/33-21.png","element":"img","alt":"1v2","inline":true,"padRight":true},{"text":"will work. 
Thus, we have that","element":"span"}],[{"style":{"width":"39%"},"width":760,"height":108,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/33-22.png","element":"img"}],[{"text":"Moreover, we have that:","element":"span"}],[{"style":{"width":"52%"},"width":1010,"height":172,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/33-23.png","element":"img"}],[{"text":"The next case is that ","element":"span"},{"style":{"height":9.6},"width":137.11,"height":24,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/33-24.png","element":"img","alt":" m > m′","inline":true},{"text":". We set ","element":"span"},{"style":{"height":16},"width":189.68,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/33-25.png","element":"img","alt":" v = Cv√ϵs","inline":true}],[{"style":{"width":"38%"},"width":734,"height":143,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/33-26.png","element":"img"}],[{"text":"For the upper bound, we see that ","element":"span"},{"style":{"height":17.38},"width":573.23,"height":43.46,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/33-27.png","element":"img","alt":" ln(2qmv4/s2) > ln(qmv4/s2) > 2","inline":true},{"text":". 
We know:","element":"span"}],[{"style":{"width":"81%"},"width":1554,"height":145,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/33-28.png","element":"img"}],[{"text":"This can be relaxed to:","element":"span"}],[{"style":{"width":"63%"},"width":1212,"height":98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/33-29.png","element":"img"}],[{"text":"Now, we know that","element":"span"}],[{"style":{"width":"64%"},"width":1226,"height":97,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/34-0.png","element":"img"}],[{"text":"This coupled with what we know about","element":"span"},{"style":{"height":25.21},"width":57.06,"height":63.03,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/34-1.png","element":"img","alt":"√2q√m","inline":true,"padRight":true},{"text":"means that:","element":"span"}],[{"style":{"width":"70%"},"width":1340,"height":281,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/34-2.png","element":"img"}],[{"text":"Moreover, we have that","element":"span"}],[{"style":{"width":"58%"},"width":1120,"height":98,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/34-3.png","element":"img"}],[{"text":"We use the condition on ","element":"span"},{"style":{"fontStyle":"italic"},"text":"q ","element":"span"},{"text":"not being more than a constant factor away from ","element":"span"},{"style":{"height":16},"width":197.71,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/34-4.png","element":"img","alt":" p = ln(1/δ)","inline":true},{"text":", to conclude that","element":"span"}],[{"style":{"width":"99%"},"width":1910,"height":134,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/34-5.png","element":"img"}],[{"text":"move within the ","element":"span"},{"style":{"height":10.8},"width":31,"height":27,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/34-6.png","element":"img","alt":" 
Θ","inline":true,"padRight":true},{"text":"notation as well.","element":"span"}]]},{"heading":"I Additional Experimental Results and Discussion","paragraphs":[[{"text":"All of the experiments (in Section 4 and in this section) were run on the default hardware on a Google Colab notebook. The code is available at ","element":"span"},{"href":"https://github.com/mjagadeesan/sparsejl-featurehashing","style":{"fontFamily":"monospace"},"text":"https://github.com/mjagadeesan/sparsejl-featurehashing","element":"a"},{"text":".","element":"span"}],[{"text":"First, we give the results of additional experiments on real-world and synthetic datasets, using the ","element":"span"},{"id":"id-69","text":"same experimental setup as Section 4.","element":"span"}],[{"style":{"width":"89%"},"width":1716,"height":568,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/34-7.png","element":"img"}],[{"text":"Figure 5: Phase transitions of ","element":"figcaption","subtype":"caption"},{"style":{"height":16},"width":280.82,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/34-8.png","element":"img","alt":" ˆv(m, 0.2, 0.01, s)","inline":true}],[{"text":"Figure 6: Phase transitions of ","element":"figcaption","subtype":"caption"},{"style":{"height":16},"width":300.74,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/34-9.png","element":"img","alt":" ˆv(m, 0.02, 0.05, s)","inline":true}],[{"text":"For the synthetic datasets, the trends in Figure ","element":"span"},{"href":"#id-69","text":"5 ","element":"a"},{"text":"and Figure ","element":"span"},{"href":"#id-69","text":"6 ","element":"a"},{"text":"look quite similar to the figures in Section 4. 
","element":"span"},{"text":"We see, though, that Figure ","element":"span"},{"href":"#id-69","text":"6 ","element":"a"},{"text":"experiences more severe non-monotonic behavior as a function of ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"in the second phase transition. Consider, for example, in Figure ","element":"span"},{"href":"#id-69","text":"6, ","element":"a"},{"text":"the behavior at ","element":"span"},{"style":{"fontStyle":"italic"},"text":"m ","element":"span"},{"text":"= 12000","element":"span"},{"text":": we see that ","element":"span"},{"style":{"height":16},"width":458.76,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/34-10.png","element":"img","alt":"ˆv(m, ϵ, δ, 4) < ˆv(m, ϵ, δ, 3)","inline":true},{"text":". ","element":"span"},{"text":"In fact, the order of the phase transitions in Figure ","element":"span"},{"href":"#id-69","text":"6 ","element":"a"},{"text":"is far from decreasing. Nonetheless, the general patterns and trends in the theoretical result still hold (e.g. the “flat” part occurs at a lower y-coordinate for lower ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"values.)","element":"span"}],[{"text":"For the real-world datasets, the trends in Figure ","element":"span"},{"href":"#id-70","text":"7, ","element":"a"},{"text":"Figure ","element":"span"},{"href":"#id-70","text":"8, ","element":"a"},{"text":"and Figure ","element":"span"},{"href":"#id-70","text":"9 ","element":"a"},{"text":"look quite similar to the figures in Section 4. 
One slight difference is that the failure probability noticeably increases in Figure ","element":"span"},{"href":"#id-70","text":"7 ","element":"a"},{"text":"and Figure","element":"span"}],[{"id":"id-70","style":{"width":"87%"},"width":1676,"height":576,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/35-0.png","element":"img"}],[{"text":"Figure 7: ","element":"figcaption","subtype":"caption"},{"style":{"height":19.01},"width":190.73,"height":47.52,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/35-1.png","element":"img","alt":"ˆδ(m, s, 0.1)","inline":true,"padRight":true},{"text":"on News20","element":"figcaption","subtype":"caption"}],[{"text":"Figure 8: ","element":"figcaption","subtype":"caption"},{"style":{"height":19.01},"width":190.73,"height":47.52,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/35-2.png","element":"img","alt":"ˆδ(m, s, 0.1)","inline":true,"padRight":true},{"text":"on Enron","element":"figcaption","subtype":"caption"}],[{"style":{"width":"42%"},"width":817,"height":597,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/35-3.png","element":"img"}],[{"text":"Figure 9: ","element":"figcaption","subtype":"caption"},{"style":{"height":19.01},"width":210.65,"height":47.52,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/35-4.png","element":"img","alt":"ˆδ(m, s, 0.03)","inline":true,"padRight":true},{"text":"on News20","element":"figcaption","subtype":"caption"}],[{"href":"#id-70","text":"8 ","element":"a"},{"text":"between ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"= 8 ","element":"span"},{"text":"and ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"= 16","element":"span"},{"text":". 
It turns out that the failure probability actually increases to a local maximum somewhere in ","element":"span"},{"style":{"height":13.2},"width":218.64,"height":33,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/35-5.png","element":"img","alt":" 12 ≤ s ≤ 16","inline":true},{"text":", and then decreases when ","element":"span"},{"style":{"height":13.2},"width":118.7,"height":33,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/35-6.png","element":"img","alt":" s ≥ 16","inline":true},{"text":", reaching lower than the value at ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"= 8 ","element":"span"},{"text":"by the time ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s ","element":"span"},{"text":"= 20","element":"span"},{"text":". There turns out to be a similar local maximum phenomenon when ","element":"span"},{"style":{"height":11.6},"width":140.23,"height":29,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/35-7.png","element":"img","alt":" ϵ = 0.07","inline":true,"padRight":true},{"text":"and ","element":"span"},{"style":{"fontStyle":"italic"},"text":"m ","element":"span"},{"text":"= 500","element":"span"},{"text":", though the local maximum occurs in ","element":"span"},{"style":{"height":13.2},"width":204.72,"height":33,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/35-8.png","element":"img","alt":" 24 ≤ s ≤ 32","inline":true,"padRight":true},{"text":"and thus is not as visible in the graph.","element":"span"}],[{"text":"As a general comment on non-monotonicity as a function of ","element":"span"},{"style":{"fontStyle":"italic"},"text":"s","element":"span"},{"text":", we emphasize that our asymptotic theoretical results characterize the ","element":"span"},{"style":{"fontStyle":"italic"},"text":"macroscopic ","element":"span"},{"text":"behavior of 
","element":"span"},{"style":{"height":16},"width":192.23,"height":40,"src":"https://cdn.bytez.com/mobilePapers/v2/arxiv/1903.03605/images/35-9.png","element":"img","alt":" v(m, ϵ, δ, s)","inline":true},{"text":", and do not preclude the existence of constant factor fluctuations for small changes in parameters. An interesting direction for future work would be to look further into this non-monotonicity and try to characterize when it arises.","element":"span"}]]}],"_version":"3.3.2"},"paperNode":"$1b:props:children:props:children:0:props:product"}]]]}]}]