% D-Lib Magazine article on a keyquery-based classification system for the CORE dataset.
% NOTE(review): year is inferred from the DOI suffix "november14" -- confirm against the publisher record.
@article{VoelskeGollubHagenetal.,
  author   = {V{\"o}lske, Michael and Gollub, Tim and Hagen, Matthias and Stein, Benno},
  title    = {A keyquery-based classification system for {CORE}},
  journal  = {D-Lib Magazine},
  year     = {2014},
  doi      = {10.1045/november14-voelske},
  url      = {http://nbn-resolving.de/urn:nbn:de:gbv:wim2-20170426-31662},
  abstract = {We apply keyquery-based taxonomy composition to compute a classification system
              for the CORE dataset, a shared crawl of about 850,000 scientific papers.
              Keyquery-based taxonomy composition can be understood as a two-phase hierarchical
              document clustering technique that utilizes search queries as cluster labels:
              In a first phase, the document collection is indexed by a reference search engine,
              and the documents are tagged with the search queries they are relevant for---their
              so-called keyqueries. In a second phase, a hierarchical clustering is formed from
              the keyqueries within an iterative process. We use the explicit topic model ESA as
              document retrieval model in order to index the CORE dataset in the reference search
              engine. Under the ESA retrieval model, documents are represented as vectors of
              similarities to Wikipedia articles; a methodology proven to be advantageous for
              text categorization tasks. Our paper presents the generated taxonomy and reports on
              quantitative properties such as document coverage and processing requirements.},
  subject  = {Massendaten},
  language = {en},
}

% Procedia Computer Science article presenting the StarWatch application.
% NOTE(review): year is inferred from the DOI "10.1016/j.procs.2015..." -- confirm; no volume is recorded here.
@article{KonichNikitinKlimenkoetal.,
  author   = {Konich, Kira and Nikitin, Igor and Klimenko, Stanislav and Malofeev, Valery and Tyul'bashev, Sergey},
  title    = {Radio Astronomical Monitoring in Virtual Environment},
  journal  = {Procedia Computer Science},
  year     = {2015},
  pages    = {592--601},
  doi      = {10.1016/j.procs.2015.11.067},
  url      = {http://nbn-resolving.de/urn:nbn:de:gbv:wim2-20170425-31431},
  abstract = {We present StarWatch, our application for real-time analysis of radio astronomical
              data in Virtual Environment. Serving as an interface to radio astronomical databases
              or being applied to live data from the radio telescopes, the application supports
              various data filters measuring signal-to-noise ratio (SNR), Doppler's drift, degree
              of signal localization on celestial sphere and other useful tools for signal
              extraction and classification. Originally designed for the database of narrow band
              signals from SETI Institute (setilive.org), the application has been recently
              extended for the detection of wide band periodic signals, necessary for the search
              of pulsars. We will also address the detection of weak signals possessing arbitrary
              waveforms and present several data filters suitable for this purpose.},
  subject  = {Virtuelle Realit{\"a}t},
  language = {en},
}