[sr-dev] git:master: pdbt: fix URL for German carrier names; filtering is not yet working completely

Henning Westerholt henning.westerholt at 1und1.de
Mon Sep 13 19:13:03 CEST 2010


Module: sip-router
Branch: master
Commit: b2dd83b03c7c858b93b51112a7f134bef2a54c4f
URL:    http://git.sip-router.org/cgi-bin/gitweb.cgi/sip-router/?a=commit;h=b2dd83b03c7c858b93b51112a7f134bef2a54c4f

Author: Henning Westerholt <henning.westerholt at 1und1.de>
Committer: Henning Westerholt <henning.westerholt at 1und1.de>
Date:   Mon Sep 13 19:12:36 2010 +0200

pdbt: fix URL for German carrier names; filtering is not yet working completely

---

 utils/pdbt/scripts/get_carrier_names_germany.sh |    5 +++--
 1 files changed, 3 insertions(+), 2 deletions(-)

diff --git a/utils/pdbt/scripts/get_carrier_names_germany.sh b/utils/pdbt/scripts/get_carrier_names_germany.sh
index 64bf83a..bb3bc6f 100755
--- a/utils/pdbt/scripts/get_carrier_names_germany.sh
+++ b/utils/pdbt/scripts/get_carrier_names_germany.sh
@@ -23,9 +23,10 @@
 # the 'Bundesnetzagentur' and convert this into the format which the pdbt tool
 # understands.
 
-url="http://www.bundesnetzagentur.de/enid/Portierungskennung/Verzeichnis_1ct.html"
+url="http://www.bundesnetzagentur.de/cln_1912/DE/Sachgebiete/Telekommunikation/RegulierungTelekommunikation/Nummernverwaltung/TechnischeNummern/Portierungskennung/VerzeichnisPortKenn_Basepage.html"
 
 # fix LOCALE problem during filtering 
 export LANG="C"
 
-wget -O - "$url" | recode latin1..utf8 | tr -d '\r' | tr '\n' '@' | sed 's/^.*Firma//' | sed 's/<\/table>.*$//' | tr '@' '\n' | sed 's/<\/p>/@/' | sed 's/<\/td>/@/' | egrep -v "^ *<" | tr -d '\n' | sed 's/@ *@/@/g' | tr '@' '\n' | sed 's/  */ /g' | sed 's/^ *//' | tr '\n' '@' | sed 's/\([^@]*\)@\(D[0-9][0-9][0-9]\)[^@]*@/\2 \1@/g' | tr '@' '\n' | sed 's/\&nbsp\;/ /g' | sed 's/\&amp\;/\&/g' | sed 's/  */ /g' | egrep -v '^$'
+wget -O - "$url" | recode latin1..utf8 | sed 's/^*.Verzeichnis der Portierungskennungen//' | awk '/<tbody>/, /<\/tbody>/' | tr -d '\r' | tr '\n' '@' | sed 's/<\/table>.*$//' | sed 's/<\/tbody>.*$//'
+




More information about the sr-dev mailing list