% Conference paper in the KDIR 2013 proceedings. The proceedings title lives in
% `booktitle` (required for @inproceedings); `series` is reserved for a named
% publication series such as LNCS.
@inproceedings{WartenaGarciaAlsina2013,
  author    = {Wartena, Christian and Garcia-Alsina, Montserrat},
  title     = {Challenges and Potentials for Keyword Extraction from Company Websites for the Development of Regional Knowledge Maps},
  booktitle = {Proceedings of the 5th International Conference on Knowledge Discovery and Information Retrieval ({KDIR})},
  pages     = {241--248},
  year      = {2013},
  doi       = {10.25968/opus-391},
  url       = {http://nbn-resolving.de/urn:nbn:de:bsz:960-opus4-3911},
  abstract  = {Regional Innovation Systems describe the relations between actors, structures and infrastructures in a region in order to stimulate innovation and regional development. For these systems the collection and organization of information is crucial. In the present paper we investigate the possibilities to extract information from websites of companies. First we describe regional innovation systems and the information types that are necessary to create them. Then we discuss the possibilities of text mining and keyword extraction techniques to extract this information from company websites. Finally, we describe a small scale experiment in which keywords related to economic sectors and commodities are extracted from the websites of over 200 companies. This experiment shows what the main challenges are for information extraction from websites for regional innovation systems.},
  language  = {en},
}