getAllStatuses(); $renderer = get_active_status_renderer(); echo ''; }
/**
 * Action callback for 'bb_head' (registered in topic_icons_init()).
 *
 * As written it echoes a single newline and nothing else.
 *
 * NOTE(review): the name suggests this should emit a stylesheet reference or
 * style block; the markup may have been lost from the string literal. Confirm
 * against the plugin's original source.
 */
function topic_icons_css() { echo "\n"; }
/**
 * Filter callback for 'bb_topic_labels' (registered in topic_icons_init()).
 *
 * On front, forum, view and tag pages it asks the active status interpreter
 * for the status of the global $topic at the current location, has the active
 * status renderer turn that status into an image file name and a tooltip, and
 * returns a sprintf()-formatted string built from the topic link, an image
 * URL, ICON_WIDTH, ICON_HEIGHT, the tooltip and the incoming label. On any
 * other page the label is returned unchanged.
 *
 * Three cases are distinguished:
 *  - the image file does not exist under icon-sets/<set>/ next to this file:
 *    the URL ICON_SET_URL_BASE.'/empty.png' is used instead;
 *  - the image exists and the tooltip is non-empty: the tooltip is passed to
 *    sprintf() twice;
 *  - the image exists and the tooltip is empty: the tooltip is passed once.
 *
 * NOTE(review): each format string contains only two or three %s placeholders
 * while six or seven arguments are supplied, so as written the width, height,
 * tooltip and label arguments never reach the output. The surrounding markup
 * was presumably stripped from these literals - restore it from the plugin's
 * original source before relying on this function.
 *
 * NOTE(review): $icon_set_url is built as ICON_SET_URL_BASE . $icon_set_name
 * with no separator, whereas the fallback uses ICON_SET_URL_BASE.'/empty.png'.
 * One of the two is off by a slash depending on how the constant is defined;
 * verify against its definition.
 *
 * @param mixed $label Label text handed in by the 'bb_topic_labels' filter.
 * @return mixed The formatted string on the page types listed above, otherwise $label as received.
 */
function topic_icons_label( $label ) { global $topic; if (bb_is_front() || bb_is_forum() || bb_is_view() || bb_is_tag()) { $icon_set_name = topic_icons_get_active_icon_set(); $icon_set_url = ICON_SET_URL_BASE . $icon_set_name; $status = get_active_status_interpreter()->getStatus(bb_get_location(), $topic); $renderer = get_active_status_renderer(); $image = $renderer->renderStatus($status); $tooltip = $renderer->renderStatusTooltip($status); $exists = file_exists(dirname(__FILE__).'/icon-sets/'.$icon_set_name.'/'.$image); if (!$exists) { return sprintf(__('
%s
%s'), get_topic_link($topic->topic_id), ICON_SET_URL_BASE.'/empty.png', ICON_WIDTH, ICON_HEIGHT, $tooltip, $label); } else if (strlen($tooltip) > 0) { return sprintf(__('
%s%s
%s'), get_topic_link($topic->topic_id), $icon_set_url.'/'.$image, ICON_WIDTH, ICON_HEIGHT, $tooltip, $tooltip, $label); } else { return sprintf(__('
%s
%s'), get_topic_link($topic->topic_id), $icon_set_url.'/'.$image, ICON_WIDTH, ICON_HEIGHT, $tooltip, $label); } } return $label; }
/**
 * Wires the plugin into the host application's hooks.
 *
 * - Removes the 'bb_closed_label' (priority 10) and 'bb_sticky_label'
 *   (priority 20) callbacks from the 'bb_topic_labels' filter and adds
 *   topic_icons_label() at priority 11 in their place.
 * - Hooks topic_icons_css() onto 'bb_head'.
 * - Hooks topic_icons_admin_page_add() onto 'bb_admin_menu_generator' and
 *   topic_icons_admin_page_process() onto 'bb_admin-header.php'.
 * - Registers a DefaultStatusInterpreter (constructed with BUSY_THRESHOLD) and
 *   a DefaultStatusRenderer, both under the key 'default'.
 */
function topic_icons_init( ) { remove_filter('bb_topic_labels', 'bb_closed_label', 10); remove_filter('bb_topic_labels', 'bb_sticky_label', 20); add_filter('bb_topic_labels', 'topic_icons_label', 11); add_action('bb_head', 'topic_icons_css'); add_action('bb_admin_menu_generator', 'topic_icons_admin_page_add'); add_action('bb_admin-header.php', 'topic_icons_admin_page_process'); topic_icons_register_status_interpreter('default', new DefaultStatusInterpreter(BUSY_THRESHOLD)); topic_icons_register_status_renderer('default', new DefaultStatusRenderer()); }
// Called at top level, so the hooks are registered as soon as this file is loaded.
topic_icons_init(); ?> Digital Humanities Questions & Answers » Topic: How do you want full text provided to you for analysis? http://digitalhumanities.org/answers/topic/how-do-you-want-full-text-provided-to-you-for-analysis Digital Humanities Questions & Answers » Topic: How do you want full text provided to you for analysis? en-US Mon, 25 Mar 2019 00:01:36 +0000 http://bbpress.org/?v=1.0.2 <![CDATA[Search]]> q http://digitalhumanities.org/answers/search.php bmschmidt on "How do you want full text provided to you for analysis?" http://digitalhumanities.org/answers/topic/how-do-you-want-full-text-provided-to-you-for-analysis#post-1895 Tue, 19 Feb 2013 03:37:22 +0000 bmschmidt 1895@http://digitalhumanities.org/answers/ <p><em>Replying to @<a href='http://digitalhumanities.org/answers/profile/jennriley'>jennriley</a>'s <a href="http://digitalhumanities.org/answers/topic/how-do-you-want-full-text-provided-to-you-for-analysis#post-1893">post</a>:</em></p> <p>My model repository would be <a href="http://chroniclingamerica.loc.gov/">Chronicling America;</a> the Library of Congress did a very nice job assembling linked open data on a hierarchical set, and (now) allowing updated downloads of the full corpus. 
And it's possible to just pull one article at a time without any fuss—anything that creates a low barrier to entry (using JSON as well as XML for metadata, for example) helps. Plus they have a nice suite of additional APIs (for snipped image data, for example)—obviously a smaller project won't want to do all of them, but some might be available. </p> tedunderwood on "How do you want full text provided to you for analysis?" http://digitalhumanities.org/answers/topic/how-do-you-want-full-text-provided-to-you-for-analysis#post-1894 Tue, 19 Feb 2013 01:40:35 +0000 tedunderwood 1894@http://digitalhumanities.org/answers/ <p>I'm a fan of HathiTrust's system. They have .zip files for each volume, with pages stored as separate .txt files within the zip. Then they have metadata for each volume as a .json object. Multiple volumes that are part of the same "work" (or I suppose, ms collection) can be linked via a record id.</p> <p>All of this is available (as copyright permits) via an API.</p> <p>Of course, this system would require some adaptation to apply to mss. But I'm mentioning HathiTrust as an example because I think it's going to be valuable in the long run to aim for <em>some</em> kind of consistency across repositories. </p> jennriley on "How do you want full text provided to you for analysis?" http://digitalhumanities.org/answers/topic/how-do-you-want-full-text-provided-to-you-for-analysis#post-1893 Tue, 19 Feb 2013 01:02:25 +0000 jennriley 1893@http://digitalhumanities.org/answers/ <p>We're in the early planning stages of an initiative that will make available full text for some of our special collections library's manuscript holdings. We'll definitely provide a search interface, but we'd also like to allow the full text of these resources to be downloaded for researchers to use in text mining and whatever other applications suit their fancy. As a researcher doing this kind of work, what's the most useful way for us to make this full text available to you? 
One big download? Something else? Are there examples out there of sites that do this particularly well that we should model our capabilities after?</p> <p>Thanks for your input!<br /> Jenn </p>