Two Regimes in the Frequency of Words and the Origins of Complex Lexicons: Zipf's Law Revisited.
R. i Cancho, und R. Solé. Journal of Quantitative Linguistics, 8 (3):
165-173(2001)
Zusammenfassung
Zipf’s law states that the frequency of a word is a power function of its rank. The exponent of the power is usually accepted to be close to (-)1. Great deviations between the predicted and real number of different words of a text, disagreements between the predicted and real exponent of the probability density function and statistics on a big corpus, make evident that word frequency as a function of the rank follows two different exponents, ˜(-)1 for the first regime and ˜(-)2 for the second. The implications of the change in exponents for the metrics of texts and for the origins of complex lexicons are analyzed.
%0 Journal Article
%1 journals/jql/CanchoS01
%A i Cancho, Ramon Ferrer
%A Solé, Ricard V.
%D 2001
%J Journal of Quantitative Linguistics
%K complex frequency origins regimes words
%N 3
%P 165-173
%T Two Regimes in the Frequency of Words and the Origins of Complex Lexicons: Zipf's Law Revisited.
%U http://dblp.uni-trier.de/db/journals/jql/jql8.html#CanchoS01
%V 8
%X Zipf’s law states that the frequency of a word is a power function of its rank. The exponent of the power is usually accepted to be close to (-)1. Great deviations between the predicted and real number of different words of a text, disagreements between the predicted and real exponent of the probability density function and statistics on a big corpus, make evident that word frequency as a function of the rank follows two different exponents, ˜(-)1 for the first regime and ˜(-)2 for the second. The implications of the change in exponents for the metrics of texts and for the origins of complex lexicons are analyzed.
@article{journals/jql/CanchoS01,
abstract = {Zipf’s law states that the frequency of a word is a power function of its rank. The exponent of the power is usually accepted to be close to (-)1. Great deviations between the predicted and real number of different words of a text, disagreements between the predicted and real exponent of the probability density function and statistics on a big corpus, make evident that word frequency as a function of the rank follows two different exponents, ˜(-)1 for the first regime and ˜(-)2 for the second. The implications of the change in exponents for the metrics of texts and for the origins of complex lexicons are analyzed.},
added-at = {2013-11-20T09:58:34.000+0100},
author = {i Cancho, Ramon Ferrer and Solé, Ricard V.},
biburl = {https://www.bibsonomy.org/bibtex/24de686b11a700bd0cd92c1d733e0ae13/giacomo.fiumara},
ee = {http://dx.doi.org/10.1076/jqul.8.3.165.4101},
interhash = {5861a32a5a0df17703a9b5df3b8d38cd},
intrahash = {4de686b11a700bd0cd92c1d733e0ae13},
journal = {Journal of Quantitative Linguistics},
keywords = {complex frequency origins regimes words},
number = 3,
pages = {165-173},
timestamp = {2013-11-20T13:19:37.000+0100},
title = {Two Regimes in the Frequency of Words and the Origins of Complex Lexicons: Zipf's Law Revisited.},
url = {http://dblp.uni-trier.de/db/journals/jql/jql8.html#CanchoS01},
volume = 8,
year = 2001
}