Last update: 16 July, 2022.
Launched: 27 December, 2011.
Note: the largest public bibliography of references on Zipf’s law for word frequencies is available here. Here we only offer a selection of references on Zipf’s law on animal behavior and organic chemistry.
Hint for browsing: Heaps’ law is another name for Herdan’s law.
2022
Ferrer-i-Cancho, R.; Lusseau, D.; McCowan, B.
Parallels of human language in the behavior of bottlenose dolphins Journal Article
In: Linguistic Frontiers, vol. 5, no. 1, pp. 5-11, 2022.
Abstract | Links | BibTeX | Tags: Law of meaning distribution, Meaning-frequency law, Menzerath-Altmann law, theory construction, Zipf's law for word frequencies, Zipf's law of abbreviation
@article{Ferrer2022a,
title = {Parallels of human language in the behavior of bottlenose dolphins},
author = {R. Ferrer-i-Cancho and D. Lusseau and B. McCowan},
url = {https://arxiv.org/abs/1605.01661},
doi = {10.2478/lf-2022-0002},
year = {2022},
date = {2022-01-01},
journal = {Linguistic Frontiers},
volume = {5},
number = {1},
pages = {5-11},
abstract = {Dolphins exhibit striking similarities with humans. Here we review them with the help of quantitative linguistics and information theory. Various statistical laws of language that are well-known in quantitative linguistics, i.e. Zipf’s law for word frequencies, the law of meaning distribution, the law of abbreviation and Menzerath’s law, have been found in dolphin vocal or gestural behavior. The information theory of these laws suggests that humans and dolphins share cost-cutting principles of organization.},
keywords = {Law of meaning distribution, Meaning-frequency law, Menzerath-Altmann law, theory construction, Zipf's law for word frequencies, Zipf's law of abbreviation},
pubstate = {published},
tppubtype = {article}
}
Semple, S.; Ferrer-i-Cancho, R.; Gustison, M.
Linguistic laws in biology Journal Article
In: Trends in Ecology and Evolution, vol. 37, no. 1, pp. 53-66, 2022.
Abstract | Links | BibTeX | Tags: Law of meaning distribution, Meaning-frequency law, Menzerath-Altmann law, Zipf's law for word frequencies, Zipf's law of abbreviation
@article{Semple2021a,
title = {Linguistic laws in biology},
author = {S. Semple and R. Ferrer-i-Cancho and M. Gustison},
doi = {10.1016/j.tree.2021.08.012},
year = {2022},
date = {2022-01-01},
journal = {Trends in Ecology and Evolution},
volume = {37},
number = {1},
pages = {53-66},
abstract = {Linguistic laws, the common statistical patterns of human language, have been investigated by quantitative linguists for nearly a century. Recently, biologists from a range of disciplines have started to explore the prevalence of these laws beyond language, finding patterns consistent with linguistic laws across multiple levels of biological organisation - from molecular (genomes, genes and proteins) to organismal (animal behaviour) to ecological (populations and ecosystems). We propose a new conceptual framework for the study of linguistic laws in biology, comprising and integrating distinct levels of analysis - from description to prediction to theory building. Adopting this framework will provide critical new insights into the fundamental rules of organization underpinning natural systems, unifying linguistic laws and core theory in biology.},
keywords = {Law of meaning distribution, Meaning-frequency law, Menzerath-Altmann law, Zipf's law for word frequencies, Zipf's law of abbreviation},
pubstate = {published},
tppubtype = {article}
}
2021
Gultekin, Yasemin B.; Hildebrand, David G. C.; Hammerschmidt, Kurt; Hage, Steffen R.
High plasticity in marmoset monkey vocal development from infancy to adulthood Journal Article
In: Science Advances, vol. 7, no. 27, 2021.
Abstract | Links | BibTeX | Tags: Zipf's law for word frequencies
@article{Gultekineabf2938,
title = {High plasticity in marmoset monkey vocal development from infancy to adulthood},
author = {Yasemin B. Gultekin and David G. C. Hildebrand and Kurt Hammerschmidt and Steffen R. Hage},
url = {https://advances.sciencemag.org/content/7/27/eabf2938},
doi = {10.1126/sciadv.abf2938},
year = {2021},
date = {2021-01-01},
journal = {Science Advances},
volume = {7},
number = {27},
publisher = {American Association for the Advancement of Science},
abstract = {The vocal behavior of human infants undergoes marked changes across their first year while becoming increasingly speech-like. Conversely, vocal development in nonhuman primates has been assumed to be largely predetermined and completed within the first postnatal months. Contradicting this assumption, we found a dichotomy between the development of call features and vocal sequences in marmoset monkeys, suggestive of a role for experience. While changes in call features were related to physical maturation, sequences of and transitions between calls remained flexible until adulthood. As in humans, marmoset vocal behavior developed in stages correlated with motor and social development stages. These findings are evidence for a prolonged phase of plasticity during marmoset vocal development, a crucial primate evolutionary preadaptation for the emergence of vocal learning and speech.},
keywords = {Zipf's law for word frequencies},
pubstate = {published},
tppubtype = {article}
}
Caetano-Anollés, Gustavo
The compressed vocabulary of microbial life Journal Article
In: Frontiers in Microbiology, vol. 12, pp. 1273, 2021, ISSN: 1664-302X.
Abstract | Links | BibTeX | Tags: Herdan's law, Menzerath-Altmann law, Zipf's law for word frequencies, Zipf's law of abbreviation
@article{10.3389/fmicb.2021.655990,
title = {The compressed vocabulary of microbial life},
author = {Gustavo Caetano-Anoll\'{e}s},
url = {https://www.frontiersin.org/article/10.3389/fmicb.2021.655990},
doi = {10.3389/fmicb.2021.655990},
issn = {1664-302X},
year = {2021},
date = {2021-01-01},
journal = {Frontiers in Microbiology},
volume = {12},
pages = {1273},
abstract = {Communication is an undisputed central activity of life that requires an evolving molecular language. It conveys meaning through messages and vocabularies. Here, I explore the existence of a growing vocabulary in the molecules and molecular functions of the microbial world. There are clear correspondences between the lexicon, syntax, semantics, and pragmatics of language organization and the module, structure, function, and fitness paradigms of molecular biology. These correspondences are constrained by universal laws and engineering principles. Macromolecular structure, for example, follows quantitative linguistic patterns arising from statistical laws that are likely universal, including the Zipf’s law, a special case of the scale-free distribution, the Heaps’ law describing sublinear growth typical of economies of scales, and the Menzerath\textendashAltmann’s law, which imposes size-dependent patterns of decreasing returns. Trade-off solutions between principles of economy, flexibility, and robustness define a “triangle of persistence” describing the impact of the environment on a biological system. The pragmatic landscape of the triangle interfaces with the syntax and semantics of molecular languages, which together with comparative and evolutionary genomic data can explain global patterns of diversification of cellular life. The vocabularies of proteins (proteomes) and functions (functionomes) revealed a significant universal lexical core supporting a universal common ancestor, an ancestral evolutionary link between Bacteria and Eukarya, and distinct reductive evolutionary strategies of language compression in Archaea and Bacteria. A “causal” word cloud strategy inspired by the dependency grammar paradigm used in catenae unfolded the evolution of lexical units associated with Gene Ontology terms at different levels of ontological abstraction. While Archaea holds the smallest, oldest, and most homogeneous vocabulary of all superkingdoms, Bacteria heterogeneously apportions a more complex vocabulary, and Eukarya pushes functional innovation through mechanisms of flexibility and robustness.},
keywords = {Herdan's law, Menzerath-Altmann law, Zipf's law for word frequencies, Zipf's law of abbreviation},
pubstate = {published},
tppubtype = {article}
}
2014
Cadeddu, Andrea; Wylie, Elizabeth K; Jurczak, Janusz; Wampler-Doty, Matthew; Grzybowski, Bartosz A
Organic Chemistry as a Language and the Implications of Chemical Linguistics for Structural and Retrosynthetic Analyses Journal Article
In: Angewandte Chemie International Edition, vol. 53, no. 31, pp. 8108-8112, 2014.
Abstract | Links | BibTeX | Tags: Zipf's law for word frequencies
@article{doi:10.1002/anie.201403708,
title = {Organic Chemistry as a Language and the Implications of Chemical Linguistics for Structural and Retrosynthetic Analyses},
author = {Andrea Cadeddu and Elizabeth K Wylie and Janusz Jurczak and Matthew Wampler-Doty and Bartosz A Grzybowski},
url = {https://onlinelibrary.wiley.com/doi/abs/10.1002/anie.201403708},
doi = {10.1002/anie.201403708},
year = {2014},
date = {2014-01-01},
journal = {Angewandte Chemie International Edition},
volume = {53},
number = {31},
pages = {8108-8112},
abstract = {Abstract Methods of computational linguistics are used to demonstrate that a natural language such as English and organic chemistry have the same structure in terms of the frequency of, respectively, text fragments and molecular fragments. This quantitative correspondence suggests that it is possible to extend the methods of computational corpus linguistics to the analysis of organic molecules. It is shown that within organic molecules bonds that have highest information content are the ones that 1) define repeat/symmetry subunits and 2) in asymmetric molecules, define the loci of potential retrosynthetic disconnections. Linguistics-based analysis appears well-suited to the analysis of complex structural and reactivity patterns within organic molecules.},
keywords = {Zipf's law for word frequencies},
pubstate = {published},
tppubtype = {article}
}
2012
Ferrer-i-Cancho, Ramon; McCowan, Brenda
The span of correlations in dolphin whistle sequences Journal Article
In: Journal of Statistical Mechanics: Theory and Experiment, vol. 2012, no. 06, pp. P06002, 2012.
Abstract | Links | BibTeX | Tags: Zipf's law for word frequencies
@article{Ferrer_i_Cancho_2012,
title = {The span of correlations in dolphin whistle sequences},
author = {Ramon Ferrer-i-Cancho and Brenda McCowan},
url = {https://doi.org/10.1088%2F1742-5468%2F2012%2F06%2Fp06002},
doi = {10.1088/1742-5468/2012/06/p06002},
year = {2012},
date = {2012-06-01},
journal = {Journal of Statistical Mechanics: Theory and Experiment},
volume = {2012},
number = {06},
pages = {P06002},
publisher = {IOP Publishing},
abstract = {Long-range correlations are found in symbolic sequences from human language, music and
DNA. Determining the span of correlations in dolphin whistle sequences is crucial for shedding
light on their communicative complexity. Dolphin whistles share various statistical properties
with human words, i.e. Zipf’s law for word frequencies (namely that the probability of the
ith most frequent word of a text is about i−α) and a parallel of the tendency of more frequent words to have more meanings. The finding
of Zipf’s law for word frequencies in dolphin whistles has been the topic of an intense
debate on its implications. One of the major arguments against the relevance of Zipf’s law
in dolphin whistles is that it is not possible to distinguish the outcome of a die-rolling
experiment from that of a linguistic or communicative source producing Zipf’s law for word
frequencies. Here we show that statistically significant whistle\textendashwhistle correlations extend
back to the second previous whistle in the sequence, using a global randomization test, and
to the fourth previous whistle, using a local randomization test. None of these correlations
are expected by a die-rolling experiment and other simple explanations of Zipf’s law for
word frequencies, such as Simon’s model, that produce sequences of unpredictable
elements.},
keywords = {Zipf's law for word frequencies},
pubstate = {published},
tppubtype = {article}
}
DNA. Determining the span of correlations in dolphin whistle sequences is crucial for shedding
light on their communicative complexity. Dolphin whistles share various statistical properties
with human words, i.e. Zipf’s law for word frequencies (namely that the probability of the
ith most frequent word of a text is about i−α) and a parallel of the tendency of more frequent words to have more meanings. The finding
of Zipf’s law for word frequencies in dolphin whistles has been the topic of an intense
debate on its implications. One of the major arguments against the relevance of Zipf’s law
in dolphin whistles is that it is not possible to distinguish the outcome of a die-rolling
experiment from that of a linguistic or communicative source producing Zipf’s law for word
frequencies. Here we show that statistically significant whistle–whistle correlations extend
back to the second previous whistle in the sequence, using a global randomization test, and
to the fourth previous whistle, using a local randomization test. None of these correlations
are expected by a die-rolling experiment and other simple explanations of Zipf’s law for
word frequencies, such as Simon’s model, that produce sequences of unpredictable
elements.
Freeberg, T M; Lucas, J R
Information theoretical approaches to chick-a-dee calls of Carolina chickadees (Poecile carolinensis) Journal Article
In: Journal of Comparative Psychology, vol. 126, pp. 68–81, 2012.
Abstract | Links | BibTeX | Tags: Zipf's law for word frequencies
@article{Freeberg2012a,
title = {Information theoretical approaches to chick-a-dee calls of Carolina chickadees (Poecile carolinensis)},
author = {T M Freeberg and J R Lucas},
doi = {10.1037/a0024906},
year = {2012},
date = {2012-01-01},
journal = {Journal of Comparative Psychology},
volume = {126},
pages = {68\textendash81},
abstract = {One aim of this study was to apply information theoretical analyses to understanding the structural complexity of chick-a-dee calls of Carolina chickadees, Poecile carolinensis. A second aim of this study was to compare this structural complexity to that of the calls of black-capped chickadees, P. atricapillus, described in an earlier published report (Hailman, Ficken, \& Ficken, 1985). Chick-a-dee calls were recorded from Carolina chickadees in a naturalistic observation study in eastern Tennessee. Calls were analyzed using approaches from information theory, including transition probability matrices, Zipf's rules, entropies, and information coding capacities of calls and notes of calls. As described for black-capped chickadees, calls of Carolina chickadees exhibited considerable structural complexity. Most results suggested that the call of Carolina chickadees is more structurally complex than that of black-capped chickadees. These findings add support to the growing literature on the complexity of this call system in Paridae species. Furthermore, these results point to the feasibility of detailed cross-species comparative analyses that may allow strong testing of hypotheses regarding signal evolution.},
keywords = {Zipf's law for word frequencies},
pubstate = {published},
tppubtype = {article}
}
2011
Doyle, Laurance R; McCowan, Brenda; Johnston, Simon; Hanser, Sean F
Information theory, animal communication, and the search for extraterrestrial intelligence Journal Article
In: Acta Astronautica, vol. 68, no. 3, pp. 406 - 417, 2011, ISSN: 0094-5765, (SETI Special Edition).
Abstract | Links | BibTeX | Tags: Zipf's law for word frequencies
@article{DOYLE2011406,
title = {Information theory, animal communication, and the search for extraterrestrial intelligence},
author = {Laurance R Doyle and Brenda McCowan and Simon Johnston and Sean F Hanser},
url = {http://www.sciencedirect.com/science/article/pii/S0094576509005682},
doi = {https://doi.org/10.1016/j.actaastro.2009.11.018},
issn = {0094-5765},
year = {2011},
date = {2011-01-01},
journal = {Acta Astronautica},
volume = {68},
number = {3},
pages = {406 - 417},
abstract = {We present ongoing research in the application of information theory to animal communication systems with the goal of developing additional detectors and estimators for possible extraterrestrial intelligent signals. Regardless of the species, for intelligence (i.e., complex knowledge) to be transmitted certain rules of information theory must still be obeyed. We demonstrate some preliminary results of applying information theory to socially complex marine mammal species (bottlenose dolphins and humpback whales) as well as arboreal squirrel monkeys, because they almost exclusively rely on vocal signals for their communications, producing signals which can be readily characterized by signal analysis. Metrics such as Zipf's Law and higher-order information-entropic structure are emerging as indicators of the communicative complexity characteristic of an “intelligent message” content within these animals’ signals, perhaps not surprising given these species’ social complexity. In addition to human languages, for comparison we also apply these metrics to pulsar signals-perhaps (arguably) the most “organized” of stellar systems-as an example of astrophysical systems that would have to be distinguished from an extraterrestrial intelligence message by such information theoretic filters. We also look at a message transmitted from Earth (Arecibo Observatory) that contains a lot of meaning but little information in the mathematical sense we define it here. We conclude that the study of non-human communication systems on our own planet can make a valuable contribution to the detection of extraterrestrial intelligence by providing quantitative general measures of communicative complexity. Studying the complex communication systems of other intelligent species on our own planet may also be one of the best ways to deprovincialize our thinking about extraterrestrial communication systems in general.},
note = {SETI Special Edition},
keywords = {Zipf's law for word frequencies},
pubstate = {published},
tppubtype = {article}
}
2010
Genty, Emilie; Byrne, Richard W
Why do gorillas make sequences of gestures? Journal Article
In: Animal Cognition, vol. 13, no. 2, pp. 287-301, 2010, ISSN: 1435-9456.
Abstract | Links | BibTeX | Tags: Zipf's law for word frequencies
@article{Genty2010,
title = {Why do gorillas make sequences of gestures?},
author = {Emilie Genty and Richard W Byrne},
url = {https://doi.org/10.1007/s10071-009-0266-4},
doi = {10.1007/s10071-009-0266-4},
issn = {1435-9456},
year = {2010},
date = {2010-01-01},
journal = {Animal Cognition},
volume = {13},
number = {2},
pages = {287-301},
abstract = {Great ape gestures have attracted considerable research interest in recent years, prompted by their flexible and intentional pattern of use; but almost all studies have focused on single gestures. Here, we report the first quantitative analysis of sequential gesture use in western gorillas (Gorilla gorilla gorilla), using data from three captive groups and one African study site. We found no evidence that gesture sequences were given for reasons of increased communicative efficiency over single gestures. Longer sequences of repeated gestures did not increase the likelihood of response, and using a sequence was seldom in reaction to communicative failure. Sequential combination of two gestures with similar meanings did not generally increase effectiveness, and sometimes reduced it. Gesture sequences were closely associated with play contexts. Markov transition analysis showed two networks of frequently co-occurring gestures, both consisting of gestures used to regulate play. One network comprised only tactile gestures, the other a mix of silent, audible and tactile gestures; apparently, these clusters resulted from gesture use in play with proximal or distal contact, respectively. No evidence was found for syntactic effects of sequential combination: meanings changed little or not at all. Semantically, many gestures overlapped massively with others in their core information (i.e. message), and gesture messages spanned relatively few functions. We suggest that the underlying semantics of gorilla gestures is highly simplified compared to that of human words. Gesture sequences allow continual adjustment of the tempo and nature of social interactions, rather than generally conveying semantically referential information or syntactic structures.},
keywords = {Zipf's law for word frequencies},
pubstate = {published},
tppubtype = {article}
}
2007
Lucas, Jeffrey R; Freeberg, Todd M
“Information” and the chick-a-dee call: Communicating with a complex vocal system Incollection
In: Otter, K (Ed.): Ecology and Behavior of Chickadees and Titmice: An Integrated Approach, pp. 199-213, Oxford University Press, Oxford, 2007.
Abstract | Links | BibTeX | Tags: Zipf's law for word frequencies
@incollection{Lucas2007a,
title = {“Information” and the chick-a-dee call: Communicating with a complex vocal system},
author = {Jeffrey R Lucas and Todd M Freeberg},
editor = {K Otter},
doi = {10.1093/acprof:oso/9780198569992.003.0015},
year = {2007},
date = {2007-01-01},
booktitle = {Ecology and Behavior of Chickadees and Titmice: An Integrated Approach},
pages = {199-213},
publisher = {Oxford University Press},
address = {Oxford},
abstract = {This chapter addresses the potential for information encoding in the chick-a-dee complex in Carolina and other species, and the potential of this call to convey complex and multifaceted information transfer. The emphasis is on the use of field experimentation to determine the context and content of calls. The review covers some general characteristics of chickadee vocal behaviour and some of the major arguments regarding definitions of ‘communication’ and ‘information,’ as these ideas are important for interpreting the notions of complexity in the chick-a-dee call. The work of Hailmans and Fickens on the structural complexity of chick-a-dee calls in black-capped and Mexican chickadees is also discussed, along with some studies on the chick-a-dee call of Carolina chickadees and studies from others on various chickadee species, all of which address exactly what chickadees might be communicating when the birds vary the structure of their calls.},
keywords = {Zipf's law for word frequencies},
pubstate = {published},
tppubtype = {incollection}
}
2005
McCowan, B; Doyle, L R; Jenkins, J M; Hanser, S F
The appropriate use of Zipf's law in animal communication studies Journal Article
In: Animal Behaviour, vol. 69, no. 1, pp. F1 - F7, 2005, ISSN: 0003-3472.
Links | BibTeX | Tags: Zipf's law for word frequencies
@article{MCCOWAN2005F1,
title = {The appropriate use of Zipf's law in animal communication studies},
author = {B McCowan and L R Doyle and J M Jenkins and S F Hanser},
url = {http://www.sciencedirect.com/science/article/pii/S000334720400346X},
doi = {https://doi.org/10.1016/j.anbehav.2004.09.002},
issn = {0003-3472},
year = {2005},
date = {2005-01-01},
journal = {Animal Behaviour},
volume = {69},
number = {1},
pages = {F1 - F7},
keywords = {Zipf's law for word frequencies},
pubstate = {published},
tppubtype = {article}
}
Suzuki, Ryuji; Buck, John R; Tyack, Peter L
The use of Zipf's law in animal communication analysis Journal Article
In: Animal Behaviour, vol. 69, no. 1, pp. F9 - F17, 2005, ISSN: 0003-3472.
Links | BibTeX | Tags: Zipf's law for word frequencies
@article{SUZUKI2005F9,
title = {The use of Zipf's law in animal communication analysis},
author = {Ryuji Suzuki and John R Buck and Peter L Tyack},
url = {http://www.sciencedirect.com/science/article/pii/S0003347204003471},
doi = {https://doi.org/10.1016/j.anbehav.2004.08.004},
issn = {0003-3472},
year = {2005},
date = {2005-01-01},
journal = {Animal Behaviour},
volume = {69},
number = {1},
pages = {F9 - F17},
keywords = {Zipf's law for word frequencies},
pubstate = {published},
tppubtype = {article}
}
2003
Furusawa, Chikara; Kaneko, Kunihiko
Zipf's law in gene expression Journal Article
In: Physical Review Letters, vol. 90, pp. 088102, 2003.
Abstract | Links | BibTeX | Tags: Zipf's law for word frequencies
@article{Furusawa2003,
title = {Zipf's law in gene expression},
author = {Chikara Furusawa and Kunihiko Kaneko},
doi = {10.1103/PhysRevLett.90.088102},
year = {2003},
date = {2003-01-01},
journal = {Physical Review Letters},
volume = {90},
pages = {088102},
abstract = {Using data from gene expression databases on various organisms and tissues, including yeast, nematodes, human normal and cancer tissues, and embryonic stem cells, we found that the abundances of expressed genes exhibit a power-law distribution with an exponent close to -1; i.e., they obey Zipf's law. Furthermore, by simulations of a simple model with an intracellular reaction network, we found that Zipf's law of chemical abundance is a universal feature of cells where such a network optimizes the efficiency and faithfulness of self-reproduction. These findings provide novel insights into the nature of the organization of reaction dynamics in living cells.},
keywords = {Zipf's law for word frequencies},
pubstate = {published},
tppubtype = {article}
}
2002
McCowan, B; Doyle, L R; Hanser, S F
Using information theory to assess the diversity, complexity and development of communicative repertoires Journal Article
In: Journal of Comparative Psychology, vol. 116, pp. 166-172, 2002.
Abstract | Links | BibTeX | Tags: Zipf's law for word frequencies
@article{McCowan2002,
title = {Using information theory to assess the diversity, complexity and development of communicative repertoires},
author = {B McCowan and L R Doyle and S F Hanser},
doi = {10.1037/0735-7036.116.2.166},
year = {2002},
date = {2002-01-01},
journal = {Journal of Comparative Psychology},
volume = {116},
pages = {166-172},
abstract = {The application of quantitative and comparative measures from information theory on animal communication can provide novel insights into the ecological, environmental, social, and contextual properties that shape the structure, organization, and function of signal repertoires. Using 2 phylogenetically different mammalian species that share similar ecological and social constraints as examples, the authors quantitatively examined the internal structure and development of a subsystem of these species' vocal repertoires in comparison with that of human language and illustrated that these species exhibit convergent developmental processes. The authors also discussed how predictions on the structure and organization of animal communication systems can be made from this new application of information theoretic measures with respect to behavioral ecology.},
keywords = {Zipf's law for word frequencies},
pubstate = {published},
tppubtype = {article}
}
Searls, David B
The language of genes Journal Article
In: Nature, vol. 420, no. 6912, pp. 211-217, 2002, ISSN: 1476-4687.
Abstract | Links | BibTeX | Tags: Zipf's law for word frequencies
@article{Searls2002,
title = {The language of genes},
author = {David B Searls},
url = {https://doi.org/10.1038/nature01255},
doi = {10.1038/nature01255},
issn = {1476-4687},
year = {2002},
date = {2002-01-01},
journal = {Nature},
volume = {420},
number = {6912},
pages = {211-217},
abstract = {Linguistic metaphors have been woven into the fabric of molecular biology since its inception. The determination of the human genome sequence has brought these metaphors to the forefront of the popular imagination, with the natural extension of the notion of DNA as language to that of the genome as the 'book of life'. But do these analogies go deeper and, if so, can the methods developed for analysing languages be applied to molecular biology? In fact, many techniques used in bioinformatics, even if developed independently, may be seen to be grounded in linguistics. Further interweaving of these fields will be instrumental in extending our understanding of the language of life.},
keywords = {Zipf's law for word frequencies},
pubstate = {published},
tppubtype = {article}
}
1999
McCowan, Brenda; Hanser, Sean F; Doyle, Laurance R
Quantitative tools for comparing animal communication systems: information theory applied to bottlenose dolphin whistle repertoires Journal Article
In: Animal Behaviour, vol. 57, no. 2, pp. 409 - 419, 1999, ISSN: 0003-3472.
Abstract | Links | BibTeX | Tags: Zipf's law for word frequencies
@article{MCCOWAN1999409,
title = {Quantitative tools for comparing animal communication systems: information theory applied to bottlenose dolphin whistle repertoires},
author = {Brenda McCowan and Sean F Hanser and Laurance R Doyle},
url = {http://www.sciencedirect.com/science/article/pii/S0003347298910004},
doi = {https://doi.org/10.1006/anbe.1998.1000},
issn = {0003-3472},
year = {1999},
date = {1999-01-01},
journal = {Animal Behaviour},
volume = {57},
number = {2},
pages = {409 - 419},
abstract = {Comparative analysis of nonhuman animal communication systems and their complexity, particularly in comparison to human language, has been generally hampered by both a lack of sufficiently extensive data sets and appropriate analytic tools. Information theory measures provide an important quantitative tool for examining and comparing communication systems across species. In this paper we use the original application of information theory, that of statistical examination of a communication system’s structure and organization. As an example of the utility of information theory to the analysis of animal communication systems, we applied a series of information theory statistics to a statistically categorized set of bottlenose dolphinTursiops truncatus, whistle vocalizations. First, we use the first-order entropic relation in a Zipf-type diagram (Zipf 1949Human Behavior and the Principle of Least Effort) to illustrate the application of temporal statistics as comparative indicators of repertoire complexity, and as possible predictive indicators of acquisition/learning in animal vocal repertoires. Second, we illustrate the need for more extensive temporal data sets when examining the higher entropic orders, indicative of higher levels of internal informational structure, of such vocalizations, which could begin to allow the statistical reconstruction of repertoire organization. Third, we propose using ‘communication capacity’ as a measure of the degree of temporal structure and complexity of statistical correlation, represented by the values of entropic order, as an objective tool for interspecies comparison of communication complexity. In doing so, we introduce a new comparative measure, the slope of Shannon entropies, and illustrate how it potentially can be used to compare the organizational complexity of vocal repertoires across a diversity of species. Finally, we illustrate the nature and predictive application of these higher-order entropies using a preliminary sample of dolphin whistle vocalizations. The purpose of this preliminary report is to re-examine the original application of information theory to the field of animal communication, illustrate its potential utility as a comparative tool for examining the internal informational structure of animal vocal repertoires and their development, and discuss its relationship to behavioural ecology and evolutionary theory.},
keywords = {Zipf's law for word frequencies},
pubstate = {published},
tppubtype = {article}
}
1996
Burgos, Javier D.
Fractal representation of the immune B cell repertoire Journal Article
In: Biosystems, vol. 39, no. 1, pp. 19–24, 1996, ISSN: 0303-2647.
Abstract | Links | BibTeX | Tags: Zipf's law for word frequencies
@article{BURGOS199619,
title = {Fractal representation of the immune B cell repertoire},
author = {Javier D. Burgos},
url = {http://www.sciencedirect.com/science/article/pii/0303264795015744},
doi = {10.1016/0303-2647(95)01574-4},
issn = {0303-2647},
year = {1996},
date = {1996-01-01},
journal = {Biosystems},
volume = {39},
number = {1},
pages = {19--24},
abstract = {The immune repertoire is characterized by a complex and dynamic organization. Here I suggest, based on the presence of well-defined immune reactivity patterns (RP) analyzed using a linguistic analogy, that the B cell repertoires could possess a fractal structure. A simple estimation method of the fractal dimension (D) for a given immune B repertoire was developed, and D demonstrated to be an useful tool to define what complexity is regarding the immune repertoire, and to evaluate the complexity level of the immune B repertoire among age-structured groups of mice sensitized with the hemagglutinin (HA) molecule of influenza virus. Also, since a fractal-linguistic point of view, considerations are made about the ontogeny, connectivity, chaotic regimes, and size of the immune repertoire. Fractal analysis indicates that the immune repertoire shows a Zipf-like scaling behavior, a statistical property of natural languages. This result suggests that immune repertoire is structured like a powerful language.},
keywords = {Zipf's law for word frequencies},
pubstate = {published},
tppubtype = {article}
}
Burgos, Javier D.; Moreno-Tovar, Pedro
Zipf-scaling behavior in the immune system Journal Article
In: Biosystems, vol. 39, no. 3, pp. 227 - 232, 1996, ISSN: 0303-2647.
Abstract | Links | BibTeX | Tags: Zipf's law for word frequencies
@article{BURGOS1996227,
title = {Zipf-scaling behavior in the immune system},
author = {Javier D. Burgos and Pedro Moreno-Tovar},
url = {http://www.sciencedirect.com/science/article/pii/0303264796016188},
doi = {https://doi.org/10.1016/0303-2647(96)01618-8},
issn = {0303-2647},
year = {1996},
date = {1996-01-01},
journal = {Biosystems},
volume = {39},
number = {3},
pages = {227 - 232},
abstract = {The Zipf law, an approach to analyzing linguistic texts, was applied to study the Cytotoxic T Lymphocytes (CTL) repertoire, one of the major components of the immune system. A Zipf-scaling behavior was observed in those CTL repertoires obtained in normal or conventional mice. In contrast, CTL repertoires from irradiated chimeric animals, showed a non-scaling statistical behavior when tested by the Zipf analysis,suggesting that normal repertoires work like a structured biological language. The fractal dimension (D) was derived from the Zipf plots, and correlates well with the nature of the repertoires: high, D > 0.8, in conventional mice. Non-fractal, D > 1, in chimeric animals, and low, D < 0.3, in athymic mice. Then, D seems to be an useful tool to characterize the current status of the immune system.},
keywords = {Zipf's law for word frequencies},
pubstate = {published},
tppubtype = {article}
}
1994
Ficken, M S; Hailman, E D; Hailman, J P
The chick-a-dee call system of the Mexican chickadee Journal Article
In: Condor, vol. 96, pp. 70-82, 1994.
Abstract | Links | BibTeX | Tags: Zipf's law for word frequencies
@article{Ficken1994,
title = {The chick-a-dee call system of the Mexican chickadee},
author = {M S Ficken and E D Hailman and J P Hailman},
doi = {10.2307/1369065},
year = {1994},
date = {1994-01-01},
journal = {Condor},
volume = {96},
pages = {70-82},
abstract = {Chick-a-dee calls of the Mexican Chickadee (Parus sclateri) are composed of combinations of three common note types (A, C and D) and one very rare type (B). Calls have the invariant sequence of notes A-B-C-D, where any note type may be omitted, given once or repeated a variable number of times before transiting to the next type. The B and C notes are phonologically similar to the B and C notes of chick-a-dee calls of the Black-capped Chickadee (P. atricapillus), but the A note is markedly different and the D note somewhat different from equivalent notes of the congener. A total of 2,071 calls recorded yielded 60 different call types, and Zipf-Mandelbrot plots show that the call system is "open"; as the sample size is increased new call types will be found without demonstrable bound. In relatively undisturbed contexts (with mate on territory, in fall flocks, alone in fall) birds gave mainly [A][D] calls with lesser numbers of [A] and [C] calls, where brackets indicate variable repetition of note types. In disturbed contexts (mobbing plastic Great Horned Owl, mobbing speaker playing calls of the Northern Pygmy-Owl, observer sitting under the nest cavity) the birds gave more [C] calls with [A][C] as well. In the longest mobbing session to owl calls, birds gave mainly [A] calls when approaching, switched to [C] calls while flying about the speaker, and then resumed [A] calls and moved off when the playback was stopped. Outside of human language, this is the second truly combinatorial system of vocal communication found in animals, the first being chick-a-dee calls of the Black-capped Chickadee. This study provides the first data substantiating quantitative differences in calls from different contexts, an important step toward understanding what kinds of information combinatorial chick-a-dee calls encode.},
keywords = {Zipf's law for word frequencies},
pubstate = {published},
tppubtype = {article}
}
Hailman, J P
Constrained permutation in 'chick-a-dee' like calls of a black-lored tit em Parus em Xanthogenys Journal Article
In: Bioacoustics, vol. 6, pp. 33-50, 1994.
Abstract | Links | BibTeX | Tags: Zipf's law for word frequencies
@article{Hailman1994,
title = {Constrained permutation in 'chick-a-dee' like calls of a black-lored tit em Parus em Xanthogenys},
author = {J P Hailman},
doi = {10.1080/09524622.1994.9753270},
year = {1994},
date = {1994-01-01},
journal = {Bioacoustics},
volume = {6},
pages = {33-50},
abstract = {Examined the vocalizations of 2 wild-caught black-lored tits. It was found that the Ss gave chick-a-dee-like calls in response to a stuffed owl. The tit used combinations of 4 note types to create 65 different call types. The repertoire of call types had the language-like property of openness to formation of new call types without limit. Calling under constant stimulus conditions changed unidirectionally during the course of mobbing, with the 4 note types replacing each other in calls, as time progressed. Thus, the tit had a constrained type of permuted order of note types, which enlarged the potential for call variety and closely resembled properties of language.},
keywords = {Zipf's law for word frequencies},
pubstate = {published},
tppubtype = {article}
}
1990
Markov, Vladimir I; Ostrovskaya, Vera M
Organization of Communication System in Tursiops Truncatus Montagu Incollection
In: Thomas, Jeanette A; Kastelein, Ronald A (Ed.): Sensory Abilities of Cetaceans: Laboratory and Field Evidence, pp. 599–622, Springer US, Boston, MA, 1990, ISBN: 978-1-4899-0858-2.
Abstract | Links | BibTeX | Tags: Zipf's law for word frequencies
@incollection{Markov1990,
title = {Organization of Communication System in Tursiops Truncatus Montagu},
author = {Vladimir I Markov and Vera M Ostrovskaya},
editor = {Jeanette A Thomas and Ronald A Kastelein},
url = {https://doi.org/10.1007/978-1-4899-0858-2_42},
doi = {10.1007/978-1-4899-0858-2_42},
isbn = {978-1-4899-0858-2},
year = {1990},
date = {1990-01-01},
booktitle = {Sensory Abilities of Cetaceans: Laboratory and Field Evidence},
pages = {599--622},
publisher = {Springer US},
address = {Boston, MA},
abstract = {The problem of the degree of complexity and semantic capabilities of the acoustic communicative system in bottlenose dolphins has been under discussion for over a quarter of a century, ever since John Lilly published his book ``Man and Dolphin'' (Lilly, 1962). Nowadays, there is an abundance of literature, with different viewpoints, but no consensus has been reached so far among researchers. The problem proved to be very complicated, both methodologically and experimentally, while the methods used turned-out to be labor-consuming and, on the whole, inefficient; all kinds of straightforward attacks failed. Meanwhile, one can try and assess potential capabilities of communicative system by analysing dolphins' mechanisms ensuring its productivity, i.e. the creation of signals and messages in amounts nessesary for communication. These mechanisms ensure the encoding of information and, in accordance with the theory, their functioning, in this way or other, affects the structure of signals and their sequences, in other words, it affects the organization of communicative system.},
keywords = {Zipf's law for word frequencies},
pubstate = {published},
tppubtype = {incollection}
}
1988
Howes-Jones, Daryl; Barlow, Jon C; Museum., Royal Ontario
The structure of the call note system of the warbling vireo Book
Royal Ontario Museum, Toronto, 1988, (The authors actually reports evidence of an exponential-like distribution, rather than the power-law like distribution of Zipf's law for word frequencies.).
Links | BibTeX | Tags: Zipf's law for word frequencies
@book{bhl113530,
title = {The structure of the call note system of the warbling vireo},
author = {Daryl Howes-Jones and Jon C Barlow and Royal Ontario Museum.},
url = {https://www.biodiversitylibrary.org/item/113530},
doi = {10.5962/bhl.title.53490},
year = {1988},
date = {1988-01-01},
pages = {52},
publisher = {Royal Ontario Museum},
address = {Toronto},
note = {The authors actually reports evidence of an exponential-like distribution, rather than the power-law like distribution of Zipf's law for word frequencies.},
keywords = {Zipf's law for word frequencies},
pubstate = {published},
tppubtype = {book}
}
1986
Bender, M. L.; Gill, Pritmohinder
The genetic code and Zipf's Law Journal Article
In: Current Anthropology, vol. 27, no. 3, pp. 280–283, 1986, ISSN: 00113204, 15375382.
Links | BibTeX | Tags: Zipf's law for word frequencies
@article{10.2307/2742889,
title = {The genetic code and Zipf's Law},
author = {M. L. Bender and Pritmohinder Gill},
url = {http://www.jstor.org/stable/2742889},
issn = {00113204, 15375382},
year = {1986},
date = {1986-01-01},
journal = {Current Anthropology},
volume = {27},
number = {3},
pages = {280--283},
publisher = {University of Chicago Press, Wenner-Gren Foundation for Anthropological Research},
keywords = {Zipf's law for word frequencies},
pubstate = {published},
tppubtype = {article}
}