About: Convert HTML entities   Sponge Permalink

An Entity of Type : owl:Thing, within Data Space : 134.155.108.49:8890 associated with source dataset(s)

This is a function that will convert HTML entities (such as , ", etc.) into their Unicode string representations. If you're scraping some sort of HTML or XML, it would be smart to run this function on your strings after you've pulled out the text you want. Call deEnt(myString). The value returned is the de-entified string. Call reEnt(myString). The value returned is the re-entified string.

AttributesValues
rdfs:label
  • Convert HTML entities
rdfs:comment
  • This is a function that will convert HTML entities (such as , ", etc.) into their Unicode string representations. If you're scraping some sort of HTML or XML, it would be smart to run this function on your strings after you've pulled out the text you want. Call deEnt(myString). The value returned is the de-entified string. Call reEnt(myString). The value returned is the re-entified string.
dcterms:subject
abstract
  • This is a function that will convert HTML entities (such as , ", etc.) into their Unicode string representations. If you're scraping some sort of HTML or XML, it would be smart to run this function on your strings after you've pulled out the text you want. This function converts entities in decimal, hex, and keyword formats. It also replaces Windows Latin-1 (CP 1252) characters with their correct Unicode equivalents. If you are having problems with some characters, you may want to try disabling CP 1252 conversion. Just replace the lines defining the commonASCII object with const commonASCII = new Object();. Call deEnt(myString). The value returned is the de-entified string. function deEnt( s ) { s = s.replace( /&([^;]+);/g, doReplace ); return s; } function doReplace( str, p1 ) { if ( p1[ 0 ] == "#" ) { p1 = p1.substr( 1 ); if ( p1[ 0 ] == "x" ) p1 = parseInt( p1.match( /[a-f0-9]+$/i ), 16 ); if ( commonASCII[ p1 ] ) return commonASCII[ p1 ]; else return String.fromCharCode( p1 ); } else { return commonEntities[ p1 ]; } } const commonASCII = { 128:"\u20AC",130:"\u201A",131:"\u0192",132:"\u201E",133:"\u2026",134:"\u2020", 135:"\u2021",136:"\u02C6",137:"\u2030",138:"\u0160",139:"\u2039",140:"\u0152", 141:"",142:"\u017D",143:"",144:"",145:"\u2018",146:"\u2019",147:"\u201C", 148:"\u201D",149:"\u2022",150:"\u2013",151:"\u2014",152:"\u02DC",153:"\u2122", 154:"\u0161",155:"\u203A",156:"\u0153",157:"",158:"\u017E",159:"\u0178" }; const commonEntities = { "quot":"\u0022","amp":"\u0026","lt":"\u003C","gt":"\u003E","nbsp":"\u0020","iexcl":"\u00A1","cent":"\u00A2","pound":"\u00A3", "curren":"\u00A4","yen":"\u00A5","brvbar":"\u00A6","sect":"\u00A7","uml":"\u00A8","copy":"\u00A9","ordf":"\u00AA","laquo":"\u00AB", "not":"\u00AC","shy":"\u000A","reg":"\u00AE","macr":"\u00AF","deg":"\u00B0","plusmn":"\u00B1","sup2":"\u00B2","sup3":"\u00B3", "acute":"\u00B4","micro":"\u00B5","para":"\u00B6","middot":"\u00B7","cedil":"\u00B8","sup1":"\u00B9","ordm":"\u00BA","raquo":"\u00BB", "frac14":"\u00BC","frac12":"\u00BD","frac34":"\u00BE","iquest":"\u00BF","Agrave":"\u00C0","Aacute":"\u00C1","Acirc":"\u00C2", "Atilde":"\u00C3","Auml":"\u00C4","Aring":"\u00C5","AElig":"\u00C6","Ccedil":"\u00C7","Egrave":"\u00C8","Eacute":"\u00C9", "Ecirc":"\u00CA","Euml":"\u00CB","Igrave":"\u00CC","Iacute":"\u00CD","Icirc":"\u00CE","Iuml":"\u00CF","ETH":"\u00D0","Ntilde":"\u00D1", "Ograve":"\u00D2","Oacute":"\u00D3","Ocirc":"\u00D4","Otilde":"\u00D5","Ouml":"\u00D6","times":"\u00D7","Oslash":"\u00D8", "Ugrave":"\u00D9","Uacute":"\u00DA","Ucirc":"\u00DB","Uuml":"\u00DC","Yacute":"\u00DD","THORN":"\u00DE","szlig":"\u00DF", "agrave":"\u00E0","aacute":"\u00E1","acirc":"\u00E2","atilde":"\u00E3","auml":"\u00E4","aring":"\u00E5","aelig":"\u00E6", "ccedil":"\u00E7","egrave":"\u00E8","eacute":"\u00E9","ecirc":"\u00EA","euml":"\u00EB","igrave":"\u00EC","iacute":"\u00ED", "icirc":"\u00EE","iuml":"\u00EF","eth":"\u00F0","ntilde":"\u00F1","ograve":"\u00F2","oacute":"\u00F3","ocirc":"\u00F4","otilde":"\u00F5", "ouml":"\u00F6","divide":"\u00F7","oslash":"\u00F8","ugrave":"\u00F9","uacute":"\u00FA","ucirc":"\u00FB","uuml":"\u00FC", "yacute":"\u00FD","thorn":"\u00FE","yuml":"\u00FF","OElig":"\u0152","oelig":"\u0153","Scaron":"\u0160","scaron":"\u0161","Yuml":"\u0178", "fnof":"\u0192","circ":"\u02C6","tilde":"\u02DC","Alpha":"\u0391","Beta":"\u0392","Gamma":"\u0393","Delta":"\u0394","Epsilon":"\u0395", "Zeta":"\u0396","Eta":"\u0397","Theta":"\u0398","Iota":"\u0399","Kappa":"\u039A","Lambda":"\u039B","Mu":"\u039C","Nu":"\u039D", "Xi":"\u039E","Omicron":"\u039F","Pi":"\u03A0","Rho":"\u03A1","Sigma":"\u03A3","Tau":"\u03A4","Upsilon":"\u03A5","Phi":"\u03A6", "Chi":"\u03A7","Psi":"\u03A8","Omega":"\u03A9","alpha":"\u03B1","beta":"\u03B2","gamma":"\u03B3","delta":"\u03B4","epsilon":"\u03B5", "zeta":"\u03B6","eta":"\u03B7","theta":"\u03B8","iota":"\u03B9","kappa":"\u03BA","lambda":"\u03BB","mu":"\u03BC","nu":"\u03BD", "xi":"\u03BE","omicron":"\u03BF","pi":"\u03C0","rho":"\u03C1","sigmaf":"\u03C2","sigma":"\u03C3","tau":"\u03C4","upsilon":"\u03C5", "phi":"\u03C6","chi":"\u03C7","psi":"\u03C8","omega":"\u03C9","thetasym":"\u03D1","upsih":"\u03D2","piv":"\u03D6","ensp":"\u2002", "emsp":"\u2003","thinsp":"\u2009","zwnj":"\u200C","zwj":"\u200D","lrm":"\u200E","rlm":"\u200F","ndash":"\u2013","mdash":"\u2014", "lsquo":"\u2018","rsquo":"\u2019","sbquo":"\u201A","ldquo":"\u201C","rdquo":"\u201D","bdquo":"\u201E","dagger":"\u2020","Dagger":"\u2021", "bull":"\u2022","hellip":"\u2026","permil":"\u2030","prime":"\u2032","Prime":"\u2033","lsaquo":"\u2039","rsaquo":"\u203A","oline":"\u203E", "frasl":"\u2044","euro":"\u20AC","image":"\u2111","weierp":"\u2118","real":"\u211C","trade":"\u2122","alefsym":"\u2135","larr":"\u2190", "uarr":"\u2191","rarr":"\u2192","darr":"\u2193","harr":"\u2194","crarr":"\u21B5","lArr":"\u21D0","uArr":"\u21D1","rArr":"\u21D2", "dArr":"\u21D3","hArr":"\u21D4","forall":"\u2200","part":"\u2202","exist":"\u2203","empty":"\u2205","nabla":"\u2207","isin":"\u2208", "notin":"\u2209","ni":"\u220B","prod":"\u220F","sum":"\u2211","minus":"\u2212","lowast":"\u2217","radic":"\u221A","prop":"\u221D", "infin":"\u221E","ang":"\u2220","and":"\u2227","or":"\u2228","cap":"\u2229","cup":"\u222A","int":"\u222B","there4":"\u2234","sim":"\u223C", "cong":"\u2245","asymp":"\u2248","ne":"\u2260","equiv":"\u2261","le":"\u2264","ge":"\u2265","sub":"\u2282","sup":"\u2283","nsub":"\u2284", "sube":"\u2286","supe":"\u2287","oplus":"\u2295","otimes":"\u2297","perp":"\u22A5","sdot":"\u22C5","lceil":"\u2308","rceil":"\u2309", "lfloor":"\u230A","rfloor":"\u230B","lang":"\u2329","rang":"\u232A","loz":"\u25CA","spades":"\u2660","clubs":"\u2663","hearts":"\u2665", "diams":"\u2666" }; Call reEnt(myString). The value returned is the re-entified string. function reEnt(s, heavy) { var safeChars; var r = ""; if (heavy) { // Heavy - convert EVERY character into an HTML entity safeChars = /[]/; } else { // Edit the line below to add more "safe" (non-entified) characters safeChars = /[a-zA-Z0-9 \-]/; } for (var i = 0; i < s.length; i++) { if (safeChars.test(s.charAt(i))) { r += s.charAt(i); } else { r += "&#" + s.charCodeAt(i) + ";"; } } return r; }
Alternative Linked Data Views: ODE     Raw Data in: CXML | CSV | RDF ( N-Triples N3/Turtle JSON XML ) | OData ( Atom JSON ) | Microdata ( JSON HTML) | JSON-LD    About   
This material is Open Knowledge   W3C Semantic Web Technology [RDF Data] Valid XHTML + RDFa
OpenLink Virtuoso version 07.20.3217, on Linux (x86_64-pc-linux-gnu), Standard Edition
Data on this page belongs to its respective rights holders.
Virtuoso Faceted Browser Copyright © 2009-2012 OpenLink Software