Hostname.php 36 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794
  1. <?php
  2. /**
  3. * Zend Framework
  4. *
  5. * LICENSE
  6. *
  7. * This source file is subject to the new BSD license that is bundled
  8. * with this package in the file LICENSE.txt.
  9. * It is also available through the world-wide-web at this URL:
  10. * http://framework.zend.com/license/new-bsd
  11. * If you did not receive a copy of the license and are unable to
  12. * obtain it through the world-wide-web, please send an email
  13. * to license@zend.com so we can send you a copy immediately.
  14. *
  15. * @category Zend
  16. * @package Zend_Validate
  17. * @copyright Copyright (c) 2005-2012 Zend Technologies USA Inc. (http://www.zend.com)
  18. * @license http://framework.zend.com/license/new-bsd New BSD License
  19. * @version $Id$
  20. */
  21. /**
  22. * @see Zend_Validate_Abstract
  23. */
  24. require_once 'Zend/Validate/Abstract.php';
  25. /**
  26. * @see Zend_Validate_Ip
  27. */
  28. require_once 'Zend/Validate/Ip.php';
  29. /**
  30. * Please note there are two standalone test scripts for testing IDN characters due to problems
  31. * with file encoding.
  32. *
  33. * The first is tests/Zend/Validate/HostnameTestStandalone.php which is designed to be run on
  34. * the command line.
  35. *
  36. * The second is tests/Zend/Validate/HostnameTestForm.php which is designed to be run via HTML
  37. * to allow users to test entering UTF-8 characters in a form.
  38. *
  39. * @category Zend
  40. * @package Zend_Validate
  41. * @copyright Copyright (c) 2005-2012 Zend Technologies USA Inc. (http://www.zend.com)
  42. * @license http://framework.zend.com/license/new-bsd New BSD License
  43. */
  44. class Zend_Validate_Hostname extends Zend_Validate_Abstract
  45. {
  46. const CANNOT_DECODE_PUNYCODE = 'hostnameCannotDecodePunycode';
  47. const INVALID = 'hostnameInvalid';
  48. const INVALID_DASH = 'hostnameDashCharacter';
  49. const INVALID_HOSTNAME = 'hostnameInvalidHostname';
  50. const INVALID_HOSTNAME_SCHEMA = 'hostnameInvalidHostnameSchema';
  51. const INVALID_LOCAL_NAME = 'hostnameInvalidLocalName';
  52. const INVALID_URI = 'hostnameInvalidUri';
  53. const IP_ADDRESS_NOT_ALLOWED = 'hostnameIpAddressNotAllowed';
  54. const LOCAL_NAME_NOT_ALLOWED = 'hostnameLocalNameNotAllowed';
  55. const UNDECIPHERABLE_TLD = 'hostnameUndecipherableTld';
  56. const UNKNOWN_TLD = 'hostnameUnknownTld';
  57. /**
  58. * @var array
  59. */
  60. protected $_messageTemplates = array(
  61. self::CANNOT_DECODE_PUNYCODE => "'%value%' appears to be a DNS hostname but the given punycode notation cannot be decoded",
  62. self::INVALID => "Invalid type given. String expected",
  63. self::INVALID_DASH => "'%value%' appears to be a DNS hostname but contains a dash in an invalid position",
  64. self::INVALID_HOSTNAME => "'%value%' does not match the expected structure for a DNS hostname",
  65. self::INVALID_HOSTNAME_SCHEMA => "'%value%' appears to be a DNS hostname but cannot match against hostname schema for TLD '%tld%'",
  66. self::INVALID_LOCAL_NAME => "'%value%' does not appear to be a valid local network name",
  67. self::INVALID_URI => "'%value%' does not appear to be a valid URI hostname",
  68. self::IP_ADDRESS_NOT_ALLOWED => "'%value%' appears to be an IP address, but IP addresses are not allowed",
  69. self::LOCAL_NAME_NOT_ALLOWED => "'%value%' appears to be a local network name but local network names are not allowed",
  70. self::UNDECIPHERABLE_TLD => "'%value%' appears to be a DNS hostname but cannot extract TLD part",
  71. self::UNKNOWN_TLD => "'%value%' appears to be a DNS hostname but cannot match TLD against known list",
  72. );
  73. /**
  74. * @var array
  75. */
  76. protected $_messageVariables = array(
  77. 'tld' => '_tld'
  78. );
  79. /**
  80. * Allows Internet domain names (e.g., example.com)
  81. */
  82. const ALLOW_DNS = 1;
  83. /**
  84. * Allows IP addresses
  85. */
  86. const ALLOW_IP = 2;
  87. /**
  88. * Allows local network names (e.g., localhost, www.localdomain)
  89. */
  90. const ALLOW_LOCAL = 4;
  91. /**
  92. * Allows hostnames that match the RFC 3986 URI host syntax
  93. */
  94. const ALLOW_URI = 8;
  95. /**
  96. * Allows all types of hostnames
  97. */
  98. const ALLOW_ALL = 15;
  99. /**
  100. * Array of valid top-level-domains
  101. *
  102. * @see ftp://data.iana.org/TLD/tlds-alpha-by-domain.txt List of all TLDs by domain
  103. * @see http://www.iana.org/domains/root/db/ Official list of supported TLDs
  104. * @var array
  105. */
  106. protected $_validTlds = array(
  107. 'ac', 'ad', 'ae', 'aero', 'af', 'ag', 'ai', 'al', 'am', 'an', 'ao', 'aq', 'ar', 'arpa',
  108. 'as', 'asia', 'at', 'au', 'aw', 'ax', 'az', 'ba', 'bb', 'bd', 'be', 'bf', 'bg', 'bh', 'bi',
  109. 'biz', 'bj', 'bm', 'bn', 'bo', 'br', 'bs', 'bt', 'bv', 'bw', 'by', 'bz', 'ca', 'cat', 'cc',
  110. 'cd', 'cf', 'cg', 'ch', 'ci', 'ck', 'cl', 'cm', 'cn', 'co', 'com', 'coop', 'cr', 'cu',
  111. 'cv', 'cx', 'cy', 'cz', 'de', 'dj', 'dk', 'dm', 'do', 'dz', 'ec', 'edu', 'ee', 'eg', 'er',
  112. 'es', 'et', 'eu', 'fi', 'fj', 'fk', 'fm', 'fo', 'fr', 'ga', 'gb', 'gd', 'ge', 'gf', 'gg',
  113. 'gh', 'gi', 'gl', 'gm', 'gn', 'gov', 'gp', 'gq', 'gr', 'gs', 'gt', 'gu', 'gw', 'gy', 'hk',
  114. 'hm', 'hn', 'hr', 'ht', 'hu', 'id', 'ie', 'il', 'im', 'in', 'info', 'int', 'io', 'iq',
  115. 'ir', 'is', 'it', 'je', 'jm', 'jo', 'jobs', 'jp', 'ke', 'kg', 'kh', 'ki', 'km', 'kn', 'kp',
  116. 'kr', 'kw', 'ky', 'kz', 'la', 'lb', 'lc', 'li', 'lk', 'lr', 'ls', 'lt', 'lu', 'lv', 'ly',
  117. 'ma', 'mc', 'md', 'me', 'mg', 'mh', 'mil', 'mk', 'ml', 'mm', 'mn', 'mo', 'mobi', 'mp',
  118. 'mq', 'mr', 'ms', 'mt', 'mu', 'museum', 'mv', 'mw', 'mx', 'my', 'mz', 'na', 'name', 'nc',
  119. 'ne', 'net', 'nf', 'ng', 'ni', 'nl', 'no', 'np', 'nr', 'nu', 'nz', 'om', 'org', 'pa', 'pe',
  120. 'pf', 'pg', 'ph', 'pk', 'pl', 'pm', 'pn', 'pr', 'pro', 'ps', 'pt', 'pw', 'py', 'qa', 're',
  121. 'ro', 'rs', 'ru', 'rw', 'sa', 'sb', 'sc', 'sd', 'se', 'sg', 'sh', 'si', 'sj', 'sk', 'sl',
  122. 'sm', 'sn', 'so', 'sr', 'st', 'su', 'sv', 'sy', 'sz', 'tc', 'td', 'tel', 'tf', 'tg', 'th',
  123. 'tj', 'tk', 'tl', 'tm', 'tn', 'to', 'tp', 'tr', 'travel', 'tt', 'tv', 'tw', 'tz', 'ua',
  124. 'ug', 'uk', 'um', 'us', 'uy', 'uz', 'va', 'vc', 've', 'vg', 'vi', 'vn', 'vu', 'wf', 'ws',
  125. 'xxx', 'ye', 'yt', 'yu', 'za', 'zm', 'zw'
  126. );
  127. /**
  128. * @var string
  129. */
  130. protected $_tld;
  131. /**
  132. * Array for valid Idns
  133. * @see http://www.iana.org/domains/idn-tables/ Official list of supported IDN Chars
  134. * (.AC) Ascension Island http://www.nic.ac/pdf/AC-IDN-Policy.pdf
  135. * (.AR) Argentina http://www.nic.ar/faqidn.html
  136. * (.AS) American Samoa http://www.nic.as/idn/chars.cfm
  137. * (.AT) Austria http://www.nic.at/en/service/technical_information/idn/charset_converter/
  138. * (.BIZ) International http://www.iana.org/domains/idn-tables/
  139. * (.BR) Brazil http://registro.br/faq/faq6.html
  140. * (.BV) Bouvet Island http://www.norid.no/domeneregistrering/idn/idn_nyetegn.en.html
  141. * (.CA) Canada http://www.iana.org/domains/idn-tables/tables/ca_fr_1.0.html
  142. * (.CAT) Catalan http://www.iana.org/domains/idn-tables/tables/cat_ca_1.0.html
  143. * (.CH) Switzerland https://nic.switch.ch/reg/ocView.action?res=EF6GW2JBPVTG67DLNIQXU234MN6SC33JNQQGI7L6#anhang1
  144. * (.CL) Chile http://www.iana.org/domains/idn-tables/tables/cl_latn_1.0.html
  145. * (.COM) International http://www.verisign.com/information-services/naming-services/internationalized-domain-names/index.html
  146. * (.DE) Germany http://www.denic.de/en/domains/idns/liste.html
  147. * (.DK) Denmark http://www.dk-hostmaster.dk/index.php?id=151
  148. * (.ES) Spain https://www.nic.es/media/2008-05/1210147705287.pdf
  149. * (.FI) Finland http://www.ficora.fi/en/index/palvelut/fiverkkotunnukset/aakkostenkaytto.html
  150. * (.GR) Greece https://grweb.ics.forth.gr/CharacterTable1_en.jsp
  151. * (.HU) Hungary http://www.domain.hu/domain/English/szabalyzat/szabalyzat.html
  152. * (.INFO) International http://www.nic.info/info/idn
  153. * (.IO) British Indian Ocean Territory http://www.nic.io/IO-IDN-Policy.pdf
  154. * (.IR) Iran http://www.nic.ir/Allowable_Characters_dot-iran
  155. * (.IS) Iceland http://www.isnic.is/domain/rules.php
  156. * (.KR) Korea http://www.iana.org/domains/idn-tables/tables/kr_ko-kr_1.0.html
  157. * (.LI) Liechtenstein https://nic.switch.ch/reg/ocView.action?res=EF6GW2JBPVTG67DLNIQXU234MN6SC33JNQQGI7L6#anhang1
  158. * (.LT) Lithuania http://www.domreg.lt/static/doc/public/idn_symbols-en.pdf
  159. * (.MD) Moldova http://www.register.md/
  160. * (.MUSEUM) International http://www.iana.org/domains/idn-tables/tables/museum_latn_1.0.html
  161. * (.NET) International http://www.verisign.com/information-services/naming-services/internationalized-domain-names/index.html
  162. * (.NO) Norway http://www.norid.no/domeneregistrering/idn/idn_nyetegn.en.html
  163. * (.NU) Niue http://www.worldnames.net/
  164. * (.ORG) International http://www.pir.org/index.php?db=content/FAQs&tbl=FAQs_Registrant&id=2
  165. * (.PE) Peru https://www.nic.pe/nuevas_politicas_faq_2.php
  166. * (.PL) Poland http://www.dns.pl/IDN/allowed_character_sets.pdf
  167. * (.PR) Puerto Rico http://www.nic.pr/idn_rules.asp
  168. * (.PT) Portugal https://online.dns.pt/dns_2008/do?com=DS;8216320233;111;+PAGE(4000058)+K-CAT-CODIGO(C.125)+RCNT(100);
  169. * (.RU) Russia http://www.iana.org/domains/idn-tables/tables/ru_ru-ru_1.0.html
  170. * (.RS) Serbia http://www.iana.org/domains/idn-tables/tables/rs_sr-rs_1.0.pdf
  171. * (.SA) Saudi Arabia http://www.iana.org/domains/idn-tables/tables/sa_ar_1.0.html
  172. * (.SE) Sweden http://www.iis.se/english/IDN_campaignsite.shtml?lang=en
  173. * (.SH) Saint Helena http://www.nic.sh/SH-IDN-Policy.pdf
  174. * (.SJ) Svalbard and Jan Mayen http://www.norid.no/domeneregistrering/idn/idn_nyetegn.en.html
  175. * (.TH) Thailand http://www.iana.org/domains/idn-tables/tables/th_th-th_1.0.html
  176. * (.TM) Turkmenistan http://www.nic.tm/TM-IDN-Policy.pdf
  177. * (.TR) Turkey https://www.nic.tr/index.php
  178. * (.UA) Ukraine http://www.iana.org/domains/idn-tables/tables/ua_cyrl_1.2.html
  179. * (.VE) Venezuela http://www.iana.org/domains/idn-tables/tables/ve_es_1.0.html
  180. * (.VN) Vietnam http://www.vnnic.vn/english/5-6-300-2-2-04-20071115.htm#1.%20Introduction
  181. *
  182. * @var array
  183. */
  184. protected $_validIdns = array(
  185. 'AC' => array(1 => '/^[\x{002d}0-9a-zà-öø-ÿāăąćĉċčďđēėęěĝġģĥħīįĵķĺļľŀłńņňŋőœŕŗřśŝşšţťŧūŭůűųŵŷźżž]{1,63}$/iu'),
  186. 'AR' => array(1 => '/^[\x{002d}0-9a-zà-ãç-êìíñ-õü]{1,63}$/iu'),
  187. 'AS' => array(1 => '/^[\x{002d}0-9a-zà-öø-ÿāăąćĉċčďđēĕėęěĝğġģĥħĩīĭįıĵķĸĺļľłńņňŋōŏőœŕŗřśŝşšţťŧũūŭůűųŵŷźż]{1,63}$/iu'),
  188. 'AT' => array(1 => '/^[\x{002d}0-9a-zà-öø-ÿœšž]{1,63}$/iu'),
  189. 'BIZ' => 'Hostname/Biz.php',
  190. 'BR' => array(1 => '/^[\x{002d}0-9a-zà-ãçéíó-õúü]{1,63}$/iu'),
  191. 'BV' => array(1 => '/^[\x{002d}0-9a-zàáä-éêñ-ôöøüčđńŋšŧž]{1,63}$/iu'),
  192. 'CA' => array(1 => '/^[\x{002d}0-9a-zàâæçéèêëîïôœùûüÿ\x{00E0}\x{00E2}\x{00E7}\x{00E8}\x{00E9}\x{00EA}\x{00EB}\x{00EE}\x{00EF}\x{00F4}\x{00F9}\x{00FB}\x{00FC}\x{00E6}\x{0153}\x{00FF}]{1,63}$/iu'),
  193. 'CAT' => array(1 => '/^[\x{002d}0-9a-z·àç-éíïòóúü]{1,63}$/iu'),
  194. 'CH' => array(1 => '/^[\x{002d}0-9a-zà-öø-ÿœ]{1,63}$/iu'),
  195. 'CL' => array(1 => '/^[\x{002d}0-9a-záéíñóúü]{1,63}$/iu'),
  196. 'CN' => 'Hostname/Cn.php',
  197. 'COM' => 'Zend/Validate/Hostname/Com.php',
  198. 'DE' => array(1 => '/^[\x{002d}0-9a-zà-öø-ÿăąāćĉčċďđĕěėęēğĝġģĥħĭĩįīıĵķĺľļłńňņŋŏőōœĸŕřŗśŝšşťţŧŭůűũųūŵŷźžż]{1,63}$/iu'),
  199. 'DK' => array(1 => '/^[\x{002d}0-9a-zäéöüæøå]{1,63}$/iu'),
  200. 'ES' => array(1 => '/^[\x{002d}0-9a-zàáçèéíïñòóúü·]{1,63}$/iu'),
  201. 'EU' => array(1 => '/^[\x{002d}0-9a-zà-öø-ÿ]{1,63}$/iu',
  202. 2 => '/^[\x{002d}0-9a-zāăąćĉċčďđēĕėęěĝğġģĥħĩīĭįıĵķĺļľŀłńņňʼnŋōŏőœŕŗřśŝšťŧũūŭůűųŵŷźżž]{1,63}$/iu',
  203. 3 => '/^[\x{002d}0-9a-zșț]{1,63}$/iu',
  204. 4 => '/^[\x{002d}0-9a-zΐάέήίΰαβγδεζηθικλμνξοπρςστυφχψωϊϋόύώ]{1,63}$/iu',
  205. 5 => '/^[\x{002d}0-9a-zабвгдежзийклмнопрстуфхцчшщъыьэюя]{1,63}$/iu',
  206. 6 => '/^[\x{002d}0-9a-zἀ-ἇἐ-ἕἠ-ἧἰ-ἷὀ-ὅὐ-ὗὠ-ὧὰ-ώᾀ-ᾇᾐ-ᾗᾠ-ᾧᾰ-ᾴᾶᾷῂῃῄῆῇῐ-ΐῖῗῠ-ῧῲῳῴῶῷ]{1,63}$/iu'),
  207. 'FI' => array(1 => '/^[\x{002d}0-9a-zäåö]{1,63}$/iu'),
  208. 'GR' => array(1 => '/^[\x{002d}0-9a-zΆΈΉΊΌΎ-ΡΣ-ώἀ-ἕἘ-Ἕἠ-ὅὈ-Ὅὐ-ὗὙὛὝὟ-ώᾀ-ᾴᾶ-ᾼῂῃῄῆ-ῌῐ-ΐῖ-Ίῠ-Ῥῲῳῴῶ-ῼ]{1,63}$/iu'),
  209. 'HK' => 'Zend/Validate/Hostname/Cn.php',
  210. 'HU' => array(1 => '/^[\x{002d}0-9a-záéíóöúüőű]{1,63}$/iu'),
  211. 'INFO'=> array(1 => '/^[\x{002d}0-9a-zäåæéöøü]{1,63}$/iu',
  212. 2 => '/^[\x{002d}0-9a-záéíóöúüőű]{1,63}$/iu',
  213. 3 => '/^[\x{002d}0-9a-záæéíðóöúýþ]{1,63}$/iu',
  214. 4 => '/^[\x{AC00}-\x{D7A3}]{1,17}$/iu',
  215. 5 => '/^[\x{002d}0-9a-zāčēģīķļņōŗšūž]{1,63}$/iu',
  216. 6 => '/^[\x{002d}0-9a-ząčėęįšūųž]{1,63}$/iu',
  217. 7 => '/^[\x{002d}0-9a-zóąćęłńśźż]{1,63}$/iu',
  218. 8 => '/^[\x{002d}0-9a-záéíñóúü]{1,63}$/iu'),
  219. 'IO' => array(1 => '/^[\x{002d}0-9a-zà-öø-ÿăąāćĉčċďđĕěėęēğĝġģĥħĭĩįīıĵķĺľļłńňņŋŏőōœĸŕřŗśŝšşťţŧŭůűũųūŵŷźžż]{1,63}$/iu'),
  220. 'IS' => array(1 => '/^[\x{002d}0-9a-záéýúíóþæöð]{1,63}$/iu'),
  221. 'JP' => 'Zend/Validate/Hostname/Jp.php',
  222. 'KR' => array(1 => '/^[\x{AC00}-\x{D7A3}]{1,17}$/iu'),
  223. 'LI' => array(1 => '/^[\x{002d}0-9a-zà-öø-ÿœ]{1,63}$/iu'),
  224. 'LT' => array(1 => '/^[\x{002d}0-9ąčęėįšųūž]{1,63}$/iu'),
  225. 'MD' => array(1 => '/^[\x{002d}0-9ăâîşţ]{1,63}$/iu'),
  226. 'MUSEUM' => array(1 => '/^[\x{002d}0-9a-zà-öø-ÿāăąćċčďđēėęěğġģħīįıķĺļľłńņňŋōőœŕŗřśşšţťŧūůűųŵŷźżžǎǐǒǔ\x{01E5}\x{01E7}\x{01E9}\x{01EF}ə\x{0292}ẁẃẅỳ]{1,63}$/iu'),
  227. 'NET' => 'Zend/Validate/Hostname/Com.php',
  228. 'NO' => array(1 => '/^[\x{002d}0-9a-zàáä-éêñ-ôöøüčđńŋšŧž]{1,63}$/iu'),
  229. 'NU' => 'Zend/Validate/Hostname/Com.php',
  230. 'ORG' => array(1 => '/^[\x{002d}0-9a-záéíñóúü]{1,63}$/iu',
  231. 2 => '/^[\x{002d}0-9a-zóąćęłńśźż]{1,63}$/iu',
  232. 3 => '/^[\x{002d}0-9a-záäåæéëíðóöøúüýþ]{1,63}$/iu',
  233. 4 => '/^[\x{002d}0-9a-záéíóöúüőű]{1,63}$/iu',
  234. 5 => '/^[\x{002d}0-9a-ząčėęįšūųž]{1,63}$/iu',
  235. 6 => '/^[\x{AC00}-\x{D7A3}]{1,17}$/iu',
  236. 7 => '/^[\x{002d}0-9a-zāčēģīķļņōŗšūž]{1,63}$/iu'),
  237. 'PE' => array(1 => '/^[\x{002d}0-9a-zñáéíóúü]{1,63}$/iu'),
  238. 'PL' => array(1 => '/^[\x{002d}0-9a-zāčēģīķļņōŗšūž]{1,63}$/iu',
  239. 2 => '/^[\x{002d}а-ик-ш\x{0450}ѓѕјљњќџ]{1,63}$/iu',
  240. 3 => '/^[\x{002d}0-9a-zâîăşţ]{1,63}$/iu',
  241. 4 => '/^[\x{002d}0-9а-яё\x{04C2}]{1,63}$/iu',
  242. 5 => '/^[\x{002d}0-9a-zàáâèéêìíîòóôùúûċġħż]{1,63}$/iu',
  243. 6 => '/^[\x{002d}0-9a-zàäåæéêòóôöøü]{1,63}$/iu',
  244. 7 => '/^[\x{002d}0-9a-zóąćęłńśźż]{1,63}$/iu',
  245. 8 => '/^[\x{002d}0-9a-zàáâãçéêíòóôõúü]{1,63}$/iu',
  246. 9 => '/^[\x{002d}0-9a-zâîăşţ]{1,63}$/iu',
  247. 10=> '/^[\x{002d}0-9a-záäéíóôúýčďĺľňŕšťž]{1,63}$/iu',
  248. 11=> '/^[\x{002d}0-9a-zçë]{1,63}$/iu',
  249. 12=> '/^[\x{002d}0-9а-ик-шђјљњћџ]{1,63}$/iu',
  250. 13=> '/^[\x{002d}0-9a-zćčđšž]{1,63}$/iu',
  251. 14=> '/^[\x{002d}0-9a-zâçöûüğış]{1,63}$/iu',
  252. 15=> '/^[\x{002d}0-9a-záéíñóúü]{1,63}$/iu',
  253. 16=> '/^[\x{002d}0-9a-zäõöüšž]{1,63}$/iu',
  254. 17=> '/^[\x{002d}0-9a-zĉĝĥĵŝŭ]{1,63}$/iu',
  255. 18=> '/^[\x{002d}0-9a-zâäéëîô]{1,63}$/iu',
  256. 19=> '/^[\x{002d}0-9a-zàáâäåæçèéêëìíîïðñòôöøùúûüýćčłńřśš]{1,63}$/iu',
  257. 20=> '/^[\x{002d}0-9a-zäåæõöøüšž]{1,63}$/iu',
  258. 21=> '/^[\x{002d}0-9a-zàáçèéìíòóùú]{1,63}$/iu',
  259. 22=> '/^[\x{002d}0-9a-zàáéíóöúüőű]{1,63}$/iu',
  260. 23=> '/^[\x{002d}0-9ΐά-ώ]{1,63}$/iu',
  261. 24=> '/^[\x{002d}0-9a-zàáâåæçèéêëðóôöøüþœ]{1,63}$/iu',
  262. 25=> '/^[\x{002d}0-9a-záäéíóöúüýčďěňřšťůž]{1,63}$/iu',
  263. 26=> '/^[\x{002d}0-9a-z·àçèéíïòóúü]{1,63}$/iu',
  264. 27=> '/^[\x{002d}0-9а-ъьюя\x{0450}\x{045D}]{1,63}$/iu',
  265. 28=> '/^[\x{002d}0-9а-яёіў]{1,63}$/iu',
  266. 29=> '/^[\x{002d}0-9a-ząčėęįšūųž]{1,63}$/iu',
  267. 30=> '/^[\x{002d}0-9a-záäåæéëíðóöøúüýþ]{1,63}$/iu',
  268. 31=> '/^[\x{002d}0-9a-zàâæçèéêëîïñôùûüÿœ]{1,63}$/iu',
  269. 32=> '/^[\x{002d}0-9а-щъыьэюяёєіїґ]{1,63}$/iu',
  270. 33=> '/^[\x{002d}0-9א-ת]{1,63}$/iu'),
  271. 'PR' => array(1 => '/^[\x{002d}0-9a-záéíóúñäëïüöâêîôûàèùæçœãõ]{1,63}$/iu'),
  272. 'PT' => array(1 => '/^[\x{002d}0-9a-záàâãçéêíóôõú]{1,63}$/iu'),
  273. 'RS' => array(1 => '/^[\x{002D}\x{0030}-\x{0039}\x{0061}-\x{007A}\x{0107}\x{010D}\x{0111}\x{0161}\x{017E}]{1,63}$/iu)'),
  274. 'RU' => array(1 => '/^[\x{002d}0-9а-яё]{1,63}$/iu'),
  275. 'SA' => array(1 => '/^[\x{002d}.0-9\x{0621}-\x{063A}\x{0641}-\x{064A}\x{0660}-\x{0669}]{1,63}$/iu'),
  276. 'SE' => array(1 => '/^[\x{002d}0-9a-zäåéöü]{1,63}$/iu'),
  277. 'SH' => array(1 => '/^[\x{002d}0-9a-zà-öø-ÿăąāćĉčċďđĕěėęēğĝġģĥħĭĩįīıĵķĺľļłńňņŋŏőōœĸŕřŗśŝšşťţŧŭůűũųūŵŷźžż]{1,63}$/iu'),
  278. 'SI' => array(
  279. 1 => '/^[\x{002d}0-9a-zà-öø-ÿ]{1,63}$/iu',
  280. 2 => '/^[\x{002d}0-9a-zāăąćĉċčďđēĕėęěĝğġģĥħĩīĭįıĵķĺļľŀłńņňʼnŋōŏőœŕŗřśŝšťŧũūŭůűųŵŷźżž]{1,63}$/iu',
  281. 3 => '/^[\x{002d}0-9a-zșț]{1,63}$/iu'),
  282. 'SJ' => array(1 => '/^[\x{002d}0-9a-zàáä-éêñ-ôöøüčđńŋšŧž]{1,63}$/iu'),
  283. 'TH' => array(1 => '/^[\x{002d}0-9a-z\x{0E01}-\x{0E3A}\x{0E40}-\x{0E4D}\x{0E50}-\x{0E59}]{1,63}$/iu'),
  284. 'TM' => array(1 => '/^[\x{002d}0-9a-zà-öø-ÿāăąćĉċčďđēėęěĝġģĥħīįĵķĺļľŀłńņňŋőœŕŗřśŝşšţťŧūŭůűųŵŷźżž]{1,63}$/iu'),
  285. 'TW' => 'Zend/Validate/Hostname/Cn.php',
  286. 'TR' => array(1 => '/^[\x{002d}0-9a-zğıüşöç]{1,63}$/iu'),
  287. 'UA' => array(1 => '/^[\x{002d}0-9a-zабвгдежзийклмнопрстуфхцчшщъыьэюяѐёђѓєѕіїјљњћќѝўџґӂʼ]{1,63}$/iu'),
  288. 'VE' => array(1 => '/^[\x{002d}0-9a-záéíóúüñ]{1,63}$/iu'),
  289. 'VN' => array(1 => '/^[ÀÁÂÃÈÉÊÌÍÒÓÔÕÙÚÝàáâãèéêìíòóôõùúýĂăĐđĨĩŨũƠơƯư\x{1EA0}-\x{1EF9}]{1,63}$/iu'),
  290. 'ایران' => array(1 => '/^[\x{0621}-\x{0624}\x{0626}-\x{063A}\x{0641}\x{0642}\x{0644}-\x{0648}\x{067E}\x{0686}\x{0698}\x{06A9}\x{06AF}\x{06CC}\x{06F0}-\x{06F9}]{1,30}$/iu'),
  291. '中国' => 'Zend/Validate/Hostname/Cn.php',
  292. '公司' => 'Zend/Validate/Hostname/Cn.php',
  293. '网络' => 'Zend/Validate/Hostname/Cn.php'
  294. );
  295. protected $_idnLength = array(
  296. 'BIZ' => array(5 => 17, 11 => 15, 12 => 20),
  297. 'CN' => array(1 => 20),
  298. 'COM' => array(3 => 17, 5 => 20),
  299. 'HK' => array(1 => 15),
  300. 'INFO'=> array(4 => 17),
  301. 'KR' => array(1 => 17),
  302. 'NET' => array(3 => 17, 5 => 20),
  303. 'ORG' => array(6 => 17),
  304. 'TW' => array(1 => 20),
  305. 'ایران' => array(1 => 30),
  306. '中国' => array(1 => 20),
  307. '公司' => array(1 => 20),
  308. '网络' => array(1 => 20),
  309. );
  310. protected $_options = array(
  311. 'allow' => self::ALLOW_DNS,
  312. 'idn' => true,
  313. 'tld' => true,
  314. 'ip' => null
  315. );
  316. /**
  317. * Sets validator options
  318. *
  319. * @param integer $allow OPTIONAL Set what types of hostname to allow (default ALLOW_DNS)
  320. * @param boolean $validateIdn OPTIONAL Set whether IDN domains are validated (default true)
  321. * @param boolean $validateTld OPTIONAL Set whether the TLD element of a hostname is validated (default true)
  322. * @param Zend_Validate_Ip $ipValidator OPTIONAL
  323. * @return void
  324. * @see http://www.iana.org/cctld/specifications-policies-cctlds-01apr02.htm Technical Specifications for ccTLDs
  325. */
  326. public function __construct($options = array())
  327. {
  328. if ($options instanceof Zend_Config) {
  329. $options = $options->toArray();
  330. } else if (!is_array($options)) {
  331. $options = func_get_args();
  332. $temp['allow'] = array_shift($options);
  333. if (!empty($options)) {
  334. $temp['idn'] = array_shift($options);
  335. }
  336. if (!empty($options)) {
  337. $temp['tld'] = array_shift($options);
  338. }
  339. if (!empty($options)) {
  340. $temp['ip'] = array_shift($options);
  341. }
  342. $options = $temp;
  343. }
  344. $options += $this->_options;
  345. $this->setOptions($options);
  346. }
  347. /**
  348. * Returns all set options
  349. *
  350. * @return array
  351. */
  352. public function getOptions()
  353. {
  354. return $this->_options;
  355. }
  356. /**
  357. * Sets the options for this validator
  358. *
  359. * @param array $options
  360. * @return Zend_Validate_Hostname
  361. */
  362. public function setOptions($options)
  363. {
  364. if (array_key_exists('allow', $options)) {
  365. $this->setAllow($options['allow']);
  366. }
  367. if (array_key_exists('idn', $options)) {
  368. $this->setValidateIdn($options['idn']);
  369. }
  370. if (array_key_exists('tld', $options)) {
  371. $this->setValidateTld($options['tld']);
  372. }
  373. if (array_key_exists('ip', $options)) {
  374. $this->setIpValidator($options['ip']);
  375. }
  376. return $this;
  377. }
  378. /**
  379. * Returns the set ip validator
  380. *
  381. * @return Zend_Validate_Ip
  382. */
  383. public function getIpValidator()
  384. {
  385. return $this->_options['ip'];
  386. }
  387. /**
  388. * @param Zend_Validate_Ip $ipValidator OPTIONAL
  389. * @return void;
  390. */
  391. public function setIpValidator(Zend_Validate_Ip $ipValidator = null)
  392. {
  393. if ($ipValidator === null) {
  394. $ipValidator = new Zend_Validate_Ip();
  395. }
  396. $this->_options['ip'] = $ipValidator;
  397. return $this;
  398. }
  399. /**
  400. * Returns the allow option
  401. *
  402. * @return integer
  403. */
  404. public function getAllow()
  405. {
  406. return $this->_options['allow'];
  407. }
  408. /**
  409. * Sets the allow option
  410. *
  411. * @param integer $allow
  412. * @return Zend_Validate_Hostname Provides a fluent interface
  413. */
  414. public function setAllow($allow)
  415. {
  416. $this->_options['allow'] = $allow;
  417. return $this;
  418. }
  419. /**
  420. * Returns the set idn option
  421. *
  422. * @return boolean
  423. */
  424. public function getValidateIdn()
  425. {
  426. return $this->_options['idn'];
  427. }
  428. /**
  429. * Set whether IDN domains are validated
  430. *
  431. * This only applies when DNS hostnames are validated
  432. *
  433. * @param boolean $allowed Set allowed to true to validate IDNs, and false to not validate them
  434. */
  435. public function setValidateIdn ($allowed)
  436. {
  437. $this->_options['idn'] = (bool) $allowed;
  438. return $this;
  439. }
  440. /**
  441. * Returns the set tld option
  442. *
  443. * @return boolean
  444. */
  445. public function getValidateTld()
  446. {
  447. return $this->_options['tld'];
  448. }
  449. /**
  450. * Set whether the TLD element of a hostname is validated
  451. *
  452. * This only applies when DNS hostnames are validated
  453. *
  454. * @param boolean $allowed Set allowed to true to validate TLDs, and false to not validate them
  455. */
  456. public function setValidateTld ($allowed)
  457. {
  458. $this->_options['tld'] = (bool) $allowed;
  459. return $this;
  460. }
  461. /**
  462. * Defined by Zend_Validate_Interface
  463. *
  464. * Returns true if and only if the $value is a valid hostname with respect to the current allow option
  465. *
  466. * @param string $value
  467. * @throws Zend_Validate_Exception if a fatal error occurs for validation process
  468. * @return boolean
  469. */
  470. public function isValid($value)
  471. {
  472. if (!is_string($value)) {
  473. $this->_error(self::INVALID);
  474. return false;
  475. }
  476. $this->_setValue($value);
  477. // Check input against IP address schema
  478. if (preg_match('/^[0-9a-f:.]*$/i', $value) &&
  479. $this->_options['ip']->setTranslator($this->getTranslator())->isValid($value)) {
  480. if (!($this->_options['allow'] & self::ALLOW_IP)) {
  481. $this->_error(self::IP_ADDRESS_NOT_ALLOWED);
  482. return false;
  483. } else {
  484. return true;
  485. }
  486. }
  487. // RFC3986 3.2.2 states:
  488. //
  489. // The rightmost domain label of a fully qualified domain name
  490. // in DNS may be followed by a single "." and should be if it is
  491. // necessary to distinguish between the complete domain name and
  492. // some local domain.
  493. //
  494. // (see ZF-6363)
  495. // Local hostnames are allowed to be partitial (ending '.')
  496. if ($this->_options['allow'] & self::ALLOW_LOCAL) {
  497. if (substr($value, -1) === '.') {
  498. $value = substr($value, 0, -1);
  499. if (substr($value, -1) === '.') {
  500. // Empty hostnames (ending '..') are not allowed
  501. $this->_error(self::INVALID_LOCAL_NAME);
  502. return false;
  503. }
  504. }
  505. }
  506. $domainParts = explode('.', $value);
  507. // Prevent partitial IP V4 adresses (ending '.')
  508. if ((count($domainParts) == 4) && preg_match('/^[0-9.a-e:.]*$/i', $value) &&
  509. $this->_options['ip']->setTranslator($this->getTranslator())->isValid($value)) {
  510. $this->_error(self::INVALID_LOCAL_NAME);
  511. }
  512. // Check input against DNS hostname schema
  513. if ((count($domainParts) > 1) && (strlen($value) >= 4) && (strlen($value) <= 254)) {
  514. $status = false;
  515. $origenc = iconv_get_encoding('internal_encoding');
  516. iconv_set_encoding('internal_encoding', 'UTF-8');
  517. do {
  518. // First check TLD
  519. $matches = array();
  520. if (preg_match('/([^.]{2,10})$/i', end($domainParts), $matches) ||
  521. (end($domainParts) == 'ایران') || (end($domainParts) == '中国') ||
  522. (end($domainParts) == '公司') || (end($domainParts) == '网络')) {
  523. reset($domainParts);
  524. // Hostname characters are: *(label dot)(label dot label); max 254 chars
  525. // label: id-prefix [*ldh{61} id-prefix]; max 63 chars
  526. // id-prefix: alpha / digit
  527. // ldh: alpha / digit / dash
  528. // Match TLD against known list
  529. $this->_tld = strtolower($matches[1]);
  530. if ($this->_options['tld']) {
  531. if (!in_array($this->_tld, $this->_validTlds)) {
  532. $this->_error(self::UNKNOWN_TLD);
  533. $status = false;
  534. break;
  535. }
  536. }
  537. /**
  538. * Match against IDN hostnames
  539. * Note: Keep label regex short to avoid issues with long patterns when matching IDN hostnames
  540. * @see Zend_Validate_Hostname_Interface
  541. */
  542. $regexChars = array(0 => '/^[a-z0-9\x2d]{1,63}$/i');
  543. if ($this->_options['idn'] && isset($this->_validIdns[strtoupper($this->_tld)])) {
  544. if (is_string($this->_validIdns[strtoupper($this->_tld)])) {
  545. $regexChars += include($this->_validIdns[strtoupper($this->_tld)]);
  546. } else {
  547. $regexChars += $this->_validIdns[strtoupper($this->_tld)];
  548. }
  549. }
  550. // Check each hostname part
  551. $check = 0;
  552. foreach ($domainParts as $domainPart) {
  553. // Decode Punycode domainnames to IDN
  554. if (strpos($domainPart, 'xn--') === 0) {
  555. $domainPart = $this->decodePunycode(substr($domainPart, 4));
  556. if ($domainPart === false) {
  557. return false;
  558. }
  559. }
  560. // Check dash (-) does not start, end or appear in 3rd and 4th positions
  561. if ((strpos($domainPart, '-') === 0)
  562. || ((strlen($domainPart) > 2) && (strpos($domainPart, '-', 2) == 2) && (strpos($domainPart, '-', 3) == 3))
  563. || (strpos($domainPart, '-') === (strlen($domainPart) - 1))) {
  564. $this->_error(self::INVALID_DASH);
  565. $status = false;
  566. break 2;
  567. }
  568. // Check each domain part
  569. $checked = false;
  570. foreach($regexChars as $regexKey => $regexChar) {
  571. $status = @preg_match($regexChar, $domainPart);
  572. if ($status > 0) {
  573. $length = 63;
  574. if (array_key_exists(strtoupper($this->_tld), $this->_idnLength)
  575. && (array_key_exists($regexKey, $this->_idnLength[strtoupper($this->_tld)]))) {
  576. $length = $this->_idnLength[strtoupper($this->_tld)];
  577. }
  578. if (iconv_strlen($domainPart, 'UTF-8') > $length) {
  579. $this->_error(self::INVALID_HOSTNAME);
  580. } else {
  581. $checked = true;
  582. break;
  583. }
  584. }
  585. }
  586. if ($checked) {
  587. ++$check;
  588. }
  589. }
  590. // If one of the labels doesn't match, the hostname is invalid
  591. if ($check !== count($domainParts)) {
  592. $this->_error(self::INVALID_HOSTNAME_SCHEMA);
  593. $status = false;
  594. }
  595. } else {
  596. // Hostname not long enough
  597. $this->_error(self::UNDECIPHERABLE_TLD);
  598. $status = false;
  599. }
  600. } while (false);
  601. iconv_set_encoding('internal_encoding', $origenc);
  602. // If the input passes as an Internet domain name, and domain names are allowed, then the hostname
  603. // passes validation
  604. if ($status && ($this->_options['allow'] & self::ALLOW_DNS)) {
  605. return true;
  606. }
  607. } else if ($this->_options['allow'] & self::ALLOW_DNS) {
  608. $this->_error(self::INVALID_HOSTNAME);
  609. }
  610. // Check for URI Syntax (RFC3986)
  611. if ($this->_options['allow'] & self::ALLOW_URI) {
  612. if (preg_match("/^([a-zA-Z0-9-._~!$&\'()*+,;=]|%[[:xdigit:]]{2}){1,254}$/i", $value)) {
  613. return true;
  614. } else {
  615. $this->_error(self::INVALID_URI);
  616. }
  617. }
  618. // Check input against local network name schema; last chance to pass validation
  619. $regexLocal = '/^(([a-zA-Z0-9\x2d]{1,63}\x2e)*[a-zA-Z0-9\x2d]{1,63}[\x2e]{0,1}){1,254}$/';
  620. $status = @preg_match($regexLocal, $value);
  621. // If the input passes as a local network name, and local network names are allowed, then the
  622. // hostname passes validation
  623. $allowLocal = $this->_options['allow'] & self::ALLOW_LOCAL;
  624. if ($status && $allowLocal) {
  625. return true;
  626. }
  627. // If the input does not pass as a local network name, add a message
  628. if (!$status) {
  629. $this->_error(self::INVALID_LOCAL_NAME);
  630. }
  631. // If local network names are not allowed, add a message
  632. if ($status && !$allowLocal) {
  633. $this->_error(self::LOCAL_NAME_NOT_ALLOWED);
  634. }
  635. return false;
  636. }
  637. /**
  638. * Decodes a punycode encoded string to it's original utf8 string
  639. * In case of a decoding failure the original string is returned
  640. *
  641. * @param string $encoded Punycode encoded string to decode
  642. * @return string
  643. */
  644. protected function decodePunycode($encoded)
  645. {
  646. $found = preg_match('/([^a-z0-9\x2d]{1,10})$/i', $encoded);
  647. if (empty($encoded) || ($found > 0)) {
  648. // no punycode encoded string, return as is
  649. $this->_error(self::CANNOT_DECODE_PUNYCODE);
  650. return false;
  651. }
  652. $separator = strrpos($encoded, '-');
  653. if ($separator > 0) {
  654. for ($x = 0; $x < $separator; ++$x) {
  655. // prepare decoding matrix
  656. $decoded[] = ord($encoded[$x]);
  657. }
  658. } else {
  659. $this->_error(self::CANNOT_DECODE_PUNYCODE);
  660. return false;
  661. }
  662. $lengthd = count($decoded);
  663. $lengthe = strlen($encoded);
  664. // decoding
  665. $init = true;
  666. $base = 72;
  667. $index = 0;
  668. $char = 0x80;
  669. for ($indexe = ($separator) ? ($separator + 1) : 0; $indexe < $lengthe; ++$lengthd) {
  670. for ($old_index = $index, $pos = 1, $key = 36; 1 ; $key += 36) {
  671. $hex = ord($encoded[$indexe++]);
  672. $digit = ($hex - 48 < 10) ? $hex - 22
  673. : (($hex - 65 < 26) ? $hex - 65
  674. : (($hex - 97 < 26) ? $hex - 97
  675. : 36));
  676. $index += $digit * $pos;
  677. $tag = ($key <= $base) ? 1 : (($key >= $base + 26) ? 26 : ($key - $base));
  678. if ($digit < $tag) {
  679. break;
  680. }
  681. $pos = (int) ($pos * (36 - $tag));
  682. }
  683. $delta = intval($init ? (($index - $old_index) / 700) : (($index - $old_index) / 2));
  684. $delta += intval($delta / ($lengthd + 1));
  685. for ($key = 0; $delta > 910 / 2; $key += 36) {
  686. $delta = intval($delta / 35);
  687. }
  688. $base = intval($key + 36 * $delta / ($delta + 38));
  689. $init = false;
  690. $char += (int) ($index / ($lengthd + 1));
  691. $index %= ($lengthd + 1);
  692. if ($lengthd > 0) {
  693. for ($i = $lengthd; $i > $index; $i--) {
  694. $decoded[$i] = $decoded[($i - 1)];
  695. }
  696. }
  697. $decoded[$index++] = $char;
  698. }
  699. // convert decoded ucs4 to utf8 string
  700. foreach ($decoded as $key => $value) {
  701. if ($value < 128) {
  702. $decoded[$key] = chr($value);
  703. } elseif ($value < (1 << 11)) {
  704. $decoded[$key] = chr(192 + ($value >> 6));
  705. $decoded[$key] .= chr(128 + ($value & 63));
  706. } elseif ($value < (1 << 16)) {
  707. $decoded[$key] = chr(224 + ($value >> 12));
  708. $decoded[$key] .= chr(128 + (($value >> 6) & 63));
  709. $decoded[$key] .= chr(128 + ($value & 63));
  710. } elseif ($value < (1 << 21)) {
  711. $decoded[$key] = chr(240 + ($value >> 18));
  712. $decoded[$key] .= chr(128 + (($value >> 12) & 63));
  713. $decoded[$key] .= chr(128 + (($value >> 6) & 63));
  714. $decoded[$key] .= chr(128 + ($value & 63));
  715. } else {
  716. $this->_error(self::CANNOT_DECODE_PUNYCODE);
  717. return false;
  718. }
  719. }
  720. return implode($decoded);
  721. }
  722. }