The group you are posting to is a Usenet group. Messages posted to this group will make your email address visible to anyone on the Internet.
Your reply message has not been sent.
Your post was successful
 |
From: Zabrane Mickael <zabra...@gmail.com>
Date: Tue, 25 Sep 2012 20:02:06 +0200
Local: Tues, Sep 25 2012 2:02 pm
Subject: [erlang-questions] Unescape HTML text
You must Sign in before you can post messages.
You do not have the permission required to post.
|
 |
From: Zabrane Mickael <zabra...@gmail.com>
Date: Tue, 25 Sep 2012 20:48:15 +0200
Local: Tues, Sep 25 2012 2:48 pm
Subject: Re: [erlang-questions] Unescape HTML text
answering my own question:
%% @doc Unescape HTML character references in `Text'.
%%
%% `Text' may be a binary or a list accepted by `list_to_binary/1'; the
%% result is always a binary. Empty input (`<<>>' or `[]') needs no clause
%% of its own: `unescape/2' returns its accumulator, which starts out as
%% `<<>>', as soon as the input is exhausted.
unescape(Text) when is_binary(Text) ->
    unescape(Text, <<>>);
unescape(Text) when is_list(Text) ->
    %% Normalise to a binary first so a single code path does the scanning.
    unescape(list_to_binary(Text), <<>>).
%% @doc Scan the binary in the first argument, replacing each recognised
%% HTML character reference with the character it denotes, and append the
%% result to `Acc'. Returns `Acc' once the input is exhausted.
%%
%% Only the references listed below are recognised; any other byte,
%% including an ampersand that starts an unknown reference, is copied to
%% the output unchanged. Non-ASCII replacements are emitted as UTF-8,
%% written as explicit code points so the result does not depend on the
%% encoding of this source file. The non-breaking-space reference is
%% replaced by an ordinary space.
%%
%% Every pattern is written as `$&' followed by the entity name rather than
%% as one string literal. The two forms are equivalent, but this one is not
%% altered if the source text is ever passed through an HTML decoder.
unescape(<<>>, Acc) ->
    Acc;
%% Whitespace and the characters that are special in markup.
unescape(<<$&, "nbsp;", T/binary>>, Acc) ->
    unescape(T, <<Acc/binary, " ">>);
unescape(<<$&, "amp;", T/binary>>, Acc) ->
    unescape(T, <<Acc/binary, "&">>);
unescape(<<$&, "quot;", T/binary>>, Acc) ->
    unescape(T, <<Acc/binary, "\"">>);
%% The apostrophe has both a named and a numeric spelling.
unescape(<<$&, "apos;", T/binary>>, Acc) ->
    unescape(T, <<Acc/binary, "'">>);
unescape(<<$&, "#39;", T/binary>>, Acc) ->
    unescape(T, <<Acc/binary, "'">>);
unescape(<<$&, "lt;", T/binary>>, Acc) ->
    unescape(T, <<Acc/binary, "<">>);
unescape(<<$&, "gt;", T/binary>>, Acc) ->
    unescape(T, <<Acc/binary, ">">>);
%% Euro sign, U+20AC. It does not fit in one byte, so /utf8 is required.
unescape(<<$&, "euro;", T/binary>>, Acc) ->
    unescape(T, <<Acc/binary, 16#20AC/utf8>>);
%% Accented Latin letters, each emitted as its UTF-8 encoding.
unescape(<<$&, "ccedil;", T/binary>>, Acc) ->   % U+00E7
    unescape(T, <<Acc/binary, 16#E7/utf8>>);
unescape(<<$&, "agrave;", T/binary>>, Acc) ->   % U+00E0
    unescape(T, <<Acc/binary, 16#E0/utf8>>);
unescape(<<$&, "acirc;", T/binary>>, Acc) ->    % U+00E2
    unescape(T, <<Acc/binary, 16#E2/utf8>>);
unescape(<<$&, "auml;", T/binary>>, Acc) ->     % U+00E4
    unescape(T, <<Acc/binary, 16#E4/utf8>>);
unescape(<<$&, "aelig;", T/binary>>, Acc) ->    % U+00E6
    unescape(T, <<Acc/binary, 16#E6/utf8>>);
unescape(<<$&, "egrave;", T/binary>>, Acc) ->   % U+00E8
    unescape(T, <<Acc/binary, 16#E8/utf8>>);
unescape(<<$&, "eacute;", T/binary>>, Acc) ->   % U+00E9
    unescape(T, <<Acc/binary, 16#E9/utf8>>);
unescape(<<$&, "ecirc;", T/binary>>, Acc) ->    % U+00EA
    unescape(T, <<Acc/binary, 16#EA/utf8>>);
unescape(<<$&, "euml;", T/binary>>, Acc) ->     % U+00EB
    unescape(T, <<Acc/binary, 16#EB/utf8>>);
unescape(<<$&, "icirc;", T/binary>>, Acc) ->    % U+00EE
    unescape(T, <<Acc/binary, 16#EE/utf8>>);
unescape(<<$&, "iuml;", T/binary>>, Acc) ->     % U+00EF
    unescape(T, <<Acc/binary, 16#EF/utf8>>);
unescape(<<$&, "ouml;", T/binary>>, Acc) ->     % U+00F6
    unescape(T, <<Acc/binary, 16#F6/utf8>>);
unescape(<<$&, "ugrave;", T/binary>>, Acc) ->   % U+00F9
    unescape(T, <<Acc/binary, 16#F9/utf8>>);
unescape(<<$&, "uacute;", T/binary>>, Acc) ->   % U+00FA
    unescape(T, <<Acc/binary, 16#FA/utf8>>);
unescape(<<$&, "ucirc;", T/binary>>, Acc) ->    % U+00FB
    unescape(T, <<Acc/binary, 16#FB/utf8>>);
unescape(<<$&, "uuml;", T/binary>>, Acc) ->     % U+00FC
    unescape(T, <<Acc/binary, 16#FC/utf8>>);
%% Anything else is copied through one byte at a time.
unescape(<<C, T/binary>>, Acc) ->
    unescape(T, <<Acc/binary, C>>).
Regards,
Zabrane
On Sep 25, 2012, at 8:02 PM, Zabrane Mickael wrote:
_______________________________________________
erlang-questions mailing list
erlang-questi...@erlang.org
http://erlang.org/mailman/listinfo/erlang-questions
You must Sign in before you can post messages.
You do not have the permission required to post.
|
 |
From: Bob Ippolito <b...@redivi.com>
Date: Tue, 25 Sep 2012 12:31:37 -0700
Local: Tues, Sep 25 2012 3:31 pm
Subject: Re: [erlang-questions] Unescape HTML text
That's only a subset of the possible inputs; you're better off using a library
that's a bit more complete. This may be useful:
https://github.com/mochi/mochiweb/blob/master/src/mochiweb_charref.erl
On Tue, Sep 25, 2012 at 11:48 AM, Zabrane Mickael <zabra...@gmail.com> wrote:
> answering my own question:
> unescape(<<>>) ->
> <<>>;
> unescape([]) ->
> <<>>;
> unescape(L) when is_list(L) ->
> unescape(list_to_binary(L));
> unescape(B) when is_binary(B) ->
> unescape(B, <<>>).
> unescape(<<>>, Acc) ->
> Acc;
> unescape(<<" ", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, " ">>);
> unescape(<<"&", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "&">>);
> unescape(<<""", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "\"">>);
> unescape(<<"'", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "\'">>);
> unescape(<<"'", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "'">>);
> unescape(<<"<", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "<">>);
> unescape(<<">", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, ">">>);
> unescape(<<"€", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "€">>);
> unescape(<<"ç", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "ç">>);
> unescape(<<"à", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "à">>);
> unescape(<<"â", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "â">>);
> unescape(<<"ä", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "ä">>);
> unescape(<<"æ", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "æ">>);
> unescape(<<"è", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "è">>);
> unescape(<<"é", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "é">>);
> unescape(<<"ê", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "ê">>);
> unescape(<<"ë", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "ë">>);
> unescape(<<"î", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "î">>);
> unescape(<<"ï", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "ï">>);
> unescape(<<"ö", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "ö">>);
> unescape(<<"ù", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "ù">>);
> unescape(<<"ú", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "ú">>);
> unescape(<<"û", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "û">>);
> unescape(<<"ü", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "ü">>);
> unescape(<<C, T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, C>>).
> Regards,
> Zabrane
> On Sep 25, 2012, at 8:02 PM, Zabrane Mickael wrote:
> Hi huis,
> I want to convert an HTML escaped text (
> http://www.w3schools.com/tags/ref_entities.asp) like this one:
> bourg&eacute;&nbsp;Cop
> to:
> bourgé Cop
> Is there any Erlang library for this?
> Regards,
> Zabrane
> _______________________________________________
> erlang-questions mailing list
> erlang-questi...@erlang.org
> http://erlang.org/mailman/listinfo/erlang-questions
_______________________________________________
erlang-questions mailing list
erlang-questi...@erlang.org
http://erlang.org/mailman/listinfo/erlang-questions
You must Sign in before you can post messages.
You do not have the permission required to post.
|
 |
From: Zabrane Mickael <zabra...@gmail.com>
Date: Tue, 25 Sep 2012 21:33:09 +0200
Local: Tues, Sep 25 2012 3:33 pm
Subject: Re: [erlang-questions] Unescape HTML text
Thanks Bob.
Exactly what I needed.
Regards,
Zabrane
On Sep 25, 2012, at 9:31 PM, Bob Ippolito wrote:
> That's a subset of possible inputs, you're better off using a library that's a bit more complete. This may be useful: https://github.com/mochi/mochiweb/blob/master/src/mochiweb_charref.erl
> On Tue, Sep 25, 2012 at 11:48 AM, Zabrane Mickael <zabra...@gmail.com> wrote:
> answering my own question:
> unescape(<<>>) -> <<>>;
> unescape([]) ->
> <<>>;
> unescape(L) when is_list(L) ->
> unescape(list_to_binary(L));
> unescape(B) when is_binary(B) ->
> unescape(B, <<>>).
> unescape(<<>>, Acc) -> Acc;
> unescape(<<" ", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, " ">>);
> unescape(<<"&", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "&">>);
> unescape(<<""", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "\"">>);
> unescape(<<"'", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "\'">>);
> unescape(<<"'", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "'">>);
> unescape(<<"<", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "<">>);
> unescape(<<">", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, ">">>);
> unescape(<<"€", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "€">>);
> unescape(<<"ç", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "ç">>);
> unescape(<<"à", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "à">>);
> unescape(<<"â", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "â">>);
> unescape(<<"ä", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "ä">>);
> unescape(<<"æ", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "æ">>);
> unescape(<<"è", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "è">>);
> unescape(<<"é", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "é">>);
> unescape(<<"ê", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "ê">>);
> unescape(<<"ë", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "ë">>);
> unescape(<<"î", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "î">>);
> unescape(<<"ï", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "ï">>);
> unescape(<<"ö", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "ö">>);
> unescape(<<"ù", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "ù">>);
> unescape(<<"ú", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "ú">>);
> unescape(<<"û", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "û">>);
> unescape(<<"ü", T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, "ü">>);
> unescape(<<C, T/binary>>, Acc) ->
> unescape(T, <<Acc/binary, C>>).
> Regards,
> Zabrane
> On Sep 25, 2012, at 8:02 PM, Zabrane Mickael wrote:
>> Hi huis,
>> I want to convert an HTML escaped text (http://www.w3schools.com/tags/ref_entities.asp) like this one:
>> bourg&eacute;&nbsp;Cop
>> to:
>> bourgé Cop
>> Is there any Erlang library for this?
>> Regards,
>> Zabrane
> _______________________________________________
> erlang-questions mailing list
> erlang-questi...@erlang.org
> http://erlang.org/mailman/listinfo/erlang-questions
_______________________________________________
erlang-questions mailing list
erlang-questi...@erlang.org
http://erlang.org/mailman/listinfo/erlang-questions
You must Sign in before you can post messages.
You do not have the permission required to post.
|
|
|