extract VT mails deduped

This commit is contained in:
Clara Dautermann 2025-04-08 19:34:51 +02:00
parent 244b77ea13
commit 833dfd852c
Signed by: clara
GPG key ID: 223391B52FAD4463

75
analyzer.ipynb Normal file
View file

@ -0,0 +1,75 @@
{
"cells": [
{
"cell_type": "code",
"execution_count": 1,
"metadata": {},
"outputs": [],
"source": [
"import json"
]
},
{
"cell_type": "code",
"execution_count": 36,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"275 entries loaded.\n",
"169 with email.\n",
"89 with VT.\n",
"73 without duplicates.\n",
"info@psychotherapie-eitel.de, psychotherapie-spindler@web.de, praxis-v-kollenbaum@gmx.de, mail@praxis-sentuerk.de, info@praxis-kusche-mall.de, moers@psychotherapie-halbeis.de, praxis.stracke@tuta.com, praxis@schimanski-psychotherapie.de, praxisdoerner@gmx.de, buergerpraxiska@online.de, info@mrl-praxis.de, psychotherapie-koeck@posteo.de, psychotherapie.haeusser@gmx.com, praxis@psychotherapie-dölker.de, j.schmidt@praxis-p3.de, info@praxislott.de, hafferisabel@aol.com, praxis@psychotherapiewissen.de, praxis@psychotherapielutz.de, shrink1@web.de, praxis.klene-gaspard@t-online.de, kvt.diez@gmail.com, mail@gertrud-fahnenbruck.de, praxis.reventlow@gmx.de, noreen.weiler@protonmail.com, praxis@michael-schwehn.de, answer@stahl-eversberg.de, praxis@psychiatricum-ka.de, praxis.urban@outlook.com, praxis@brening-becker.de, praxis@drdamian.de, info@ptvo.de, praxis@wieske.de, hansbiewer@web.de, info@psychotherapiepraxis-borovac.de, praxis.friedebach@web.de, praxis@julia-luecke.de, kontakt@psychotherapie-heuser.de, info@praxis-seekircher.de, mail@psychotherapie-klingel.de, praxis@helma-blaurock.de, praxis@psychotherapie-okello.de, psychotherapie@bianca-maria-ehbauer.de, therapeut.schorn@web.de, praxis-burkart@t-online.de, mail@psychotherapie-schauer.de, praxis@erb-bies.de, praxis@psychotherapie-senger.de, kontakt@hm-psychotherapie.de, bikai@t-online.de, info@psychotherapie-merkens.de, claudia-lehner@t-online.de, praxis.reinartz@t-online.de, praxis@neurologie-psychiatrie-karlsruhe.de, mueller-aunda@web.de, wolf-vtp@web.de, praxis.leufke@gmail.com, kontakt@zeneka.de, mail@rieger-psychotherapie.de, info@praxis-sentuerk.de, goeke.g@web.de, martina.eckrich@web.de, mail@praxis-katja-beck.de, praxis-vollmann@posteo.de, psychotherapie-barton@web.de, baschnagel@psychotherapie-halbeis.de, psychotherapie-neumann@gmx.de, info@praxis-heckenlaible.de, praxis.kugele@gmail.com, hagenpraxiska@online.de, pt-juergens@web.de, kontakt@psychotherapie-neureut.de, gia.nakat@gmail.com\n"
]
}
],
"source": [
"# Collect the unique e-mail addresses of every therapist entry that lists\n",
"# behavioural therapy (VT) for adults and print them as one comma-separated line.\n",
"VT_ADULTS = 'Verhaltenstherapeutische Einzeltherapie Erwachsene'\n",
"\n",
"# Decode explicitly as UTF-8: the data contains non-ASCII characters (umlauts in\n",
"# addresses) and open() otherwise falls back to a platform-dependent encoding.\n",
"with open('./data/therapists.json', 'r', encoding='utf-8') as infile:\n",
"    loaded = json.load(infile)\n",
"\n",
"print(f'{len(loaded)} entries loaded.')\n",
"\n",
"# Keep only entries that carry a 'mails' key at all.\n",
"with_mail = [entry for entry in loaded if 'mails' in entry]\n",
"print(f'{len(with_mail)} with email.')\n",
"\n",
"# .get() so an entry without 'therapy_types' is skipped instead of raising KeyError.\n",
"with_vt = [entry for entry in with_mail if VT_ADULTS in (entry.get('therapy_types') or ())]\n",
"print(f'{len(with_vt)} with VT.')\n",
"\n",
"# Lower-case before de-duplicating so addresses differing only in case collapse;\n",
"# sorted() makes the printed order reproducible (plain set order varies per run).\n",
"allmails = sorted({mail.lower() for entry in with_vt for mail in entry['mails']})\n",
"\n",
"print(f'{len(allmails)} without duplicates.')\n",
"\n",
"print(', '.join(allmails))"
]
}
],
"metadata": {
"kernelspec": {
"display_name": "python-minimal kernel",
"language": "python",
"name": "python-minimal"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.12.7"
}
},
"nbformat": 4,
"nbformat_minor": 2
}