# # Copyright (c) 2006 Jun Wang # All rights reserved. # # Redistribution and use in source and binary forms, with or without # modification, are permitted provided that the following conditions # are met: # 1. Redistributions of source code must retain the above copyright # notice, this list of conditions and the following disclaimer. # 2. Redistributions in binary form must reproduce the above copyright # notice, this list of conditions and the following disclaimer in the # documentation and/or other materials provided with the distribution. # 3. All advertising materials mentioning features or use of this software # must display the following acknowledgement: # This product includes software developed by # CiteULike and its # contributors. # 4. Neither the name of CiteULike nor the names of its # contributors may be used to endorse or promote products derived # from this software without specific prior written permission. # # THIS SOFTWARE IS PROVIDED BY CITEULIKE.ORG AND CONTRIBUTORS # ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED # TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR # PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS # BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR # CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF # SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS # INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN # CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) # ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE # POSSIBILITY OF SUCH DAMAGE. plugin { # Integer version number for the plugin code. When this number is incremented, # CiteULike may reparse all existing articles with the new code. version {1} # The name of the plugin, as displayed on the "CiteULike supports..." page # name {Language Evolution and Computation} # The link the front page of this service # url {http://www.isrl.uiuc.edu/~amag/langev} # Author Name author {Jun Wang} # Author email email {junwang4@uiuc.edu} # Parser language language {perl} # Regular expression to match URLs that the plugin is # *potentially* interested in. Any URL matching this regexp # will cause your parser to be invoked. Currently, this will # require fork()ing a process, so you should try to reduce the # number of false positives by making your regexp as restrictive as # possible. If it is not possible to determine whether or not your plugin is # interested purely on the basis of the URL, you will have a chance # to refine this decision in your code. For now, try to make a # reasonable approximation - like, check for URLs on the right hostname # Note: Some universities provide mirrors of commericial publishers' sites # with different hostnames, so you should provide some leeway in your # regexp if that applies to you. regexp {http://www.isrl.uiuc.edu/~?amag/langev/paper/(.*)} } # # Linkout formatting # # CiteULike doesn't store URLs for articles. # Instead it stores the raw ingredients required to build the # dynamically. # Each plugin is required to define a small procedure which does this # formatting # See the HOWTO file for more details. # # The variables following variables are defined for your use # in the function: type ikey_1 ckey_1 ikey_2 ckey_2 # format_linkout LNGV { return [list "LangEv" "http://www.isrl.uiuc.edu/~amag/langev/paper/${ckey_1}.html"] } # # TESTS # # Each plugin MUST provide a set of tests. The motivation behind this is # that web scraping code is inherently fragile, and is likely to break # whenever the provider decides to redisign their site. CiteULike # willperiodically run tests to see if anything has broken. # Please provide as comprehensive a set of tests as possible. # If you ever fix a bug in the parser, it is highly recommended that # you add the offending page as a test case. test {http://www.isrl.uiuc.edu/~amag/langev/paper/ferrer02zipf.html} { formatted_url {LangEv http://www.isrl.uiuc.edu/~amag/langev/paper/ferrer02zipf.html} formatted_url {DOI http://dx.doi.org/10.1142/S0219525902000468} linkout {LNGV {} ferrer02zipf {} {}} linkout {DOI {} 10.1142/S0219525902000468 {} {}} author {Ferrer-I-Cancho Ramon R {Ramon Ferrer-i-Cancho}} author {Sole Ricard RV {Ricard V. Sole}} title {Zipf's law and random texts} journal {Advances in Complex Systems} volume 5 issue 1 start_page 1 end_page 6 year 2002 type JOUR doi 10.1142/S0219525902000468 url http://www.isrl.uiuc.edu/~amag/langev/paper/ferrer02zipf.html keywords {Human language; scaling; Zipf's law; monkey languages; random texts} abstract {Random-text models have been proposed as an explanation for the power law relationship between word frequency and rank, the so-called Zipf's law. They are generally regarded as null hypotheses rather than models in the strict sense. In this context, recent theories of language emergence and evolution assume this law as a priori information with no need of explanation. Here, random texts and real texts are compared through (a) the so-called lexical spectrum and (b) the distribution of words having the same length. It is shown that real texts fill the lexical spectrum much more efficiently and regardless of the word length, suggesting that the meaningfulness of Zipf's law is high.} status ok } test {http://www.isrl.uiuc.edu/~amag/langev/paper/niyogi_book.html} { formatted_url {LangEv http://www.isrl.uiuc.edu/~amag/langev/paper/niyogi_book.html} linkout {LNGV {} niyogi_book {} {}} author {Niyogi Partha P {Partha Niyogi}} year {2006} month {April} type BOOK url http://www.isrl.uiuc.edu/~amag/langev/paper/niyogi_book.html publisher {MIT Press} title {The Computational Nature of Language Learning and Evolution} status ok address {Cambridge, MA} status ok } test {http://www.isrl.uiuc.edu/~amag/langev/paper/pinker03LanguageAs.html} { formatted_url {LangEv http://www.isrl.uiuc.edu/~amag/langev/paper/pinker03LanguageAs.html} linkout {LNGV {} pinker03LanguageAs {} {}} year 2003 type INCOL url http://www.isrl.uiuc.edu/~amag/langev/paper/pinker03LanguageAs.html publisher {Oxford University Press} title_secondary {Language Evolution: The States of the Art} editor {Christiansen {} MH {M.H. Christiansen}} editor {Kirby {} S {S. Kirby}} title {Language as an adaptation to the cognitive niche} author {Pinker Steven S {Steven Pinker}} status ok }