n $r;
}

/**
 * Forum moderator permission check.
 *
 * Permission keys used with this check: allowtop, allowmove, allowupdate,
 * allowdelete, allowbanuser, allowviewip, allowdeleteuser.
 *
 * Rules:
 *  - groups 1 and 2 (administrators) hold every permission;
 *  - groups 3 and 4 hold a permission only when the group row has the flag set
 *    AND the current user (global $uid) is listed in the forum's 'moduids';
 *  - every other group is denied.
 *
 * Unknown forums or groups are treated as "denied" instead of reading
 * undefined array keys.
 *
 * @param int|string $fid    Forum id, used as key into the global $forumlist.
 * @param int|string $gid    Group id, used as key into the global $grouplist.
 * @param string     $access Permission key looked up in the group row.
 * @return bool TRUE when the permission is granted.
 */
function forum_access_mod($fid, $gid, $access)
{
    global $grouplist, $forumlist, $uid;

    // Per-request memo of computed (non-admin) answers.
    static $result = array();
    $k = $fid . '-' . $gid . '-' . $access;
    if (isset($result[$k])) return $result[$k];

    // Administrators have all permissions.
    if (1 == $gid || 2 == $gid) return TRUE;

    $r = FALSE;
    if (3 == $gid || 4 == $gid) {
        // Guard both lookups: a missing group or forum simply means "no permission".
        $group = isset($grouplist[$gid]) ? $grouplist[$gid] : array();
        $forum = isset($forumlist[$fid]) ? $forumlist[$fid] : array();
        if (!empty($group[$access]) && isset($forum['moduids'])) {
            $r = (bool)in_string($uid, $forum['moduids']);
        }
    }
    $result[$k] = $r;

    return $r;
}

/**
 * Tell whether a user acts as moderator of a forum.
 *
 * Groups 1 and 2 (administrators) always qualify. Groups 3 and 4 qualify when
 * $fid is 0 (the original code marks this shortcut as "not rigorous") or when
 * $uid is listed in the forum's 'moduids'. Any other group is rejected.
 *
 * An unknown forum id is treated as "not a moderator" instead of reading an
 * undefined array key.
 *
 * @param int|string $fid Forum id, used as key into the global $forumlist.
 * @param int|string $gid Group id of the user.
 * @param int|string $uid User id searched in the forum's 'moduids'.
 * @return mixed TRUE/FALSE on the early paths, otherwise whatever in_string() returns.
 */
function forum_is_mod($fid, $gid, $uid)
{
    global $forumlist;

    // Administrators have all permissions.
    if (1 == $gid || 2 == $gid) return TRUE;

    // Only the two moderator groups can qualify from here on.
    if (3 != $gid && 4 != $gid) return FALSE;

    // Not rigorous: without a concrete forum every moderator-group member passes.
    if (0 == $fid) return TRUE;

    // Unknown forum, or forum without a moderator list.
    if (!isset($forumlist[$fid]['moduids'])) return FALSE;

    return in_string($uid, $forumlist[$fid]['moduids']);
}

// ------------> 其他方法

/**
 * Formatting hook for a forum_access row.
 *
 * The row is received by reference, but the visible body performs no
 * formatting: it only bails out early for empty input.
 *
 * @param mixed $access Row to format (left untouched).
 * @return void
 */
function forum_access_format(&$access)
{
    $has_data = !empty($access);
    if (!$has_data) {
        return;
    }
    // Nothing to format at the moment.
}

/**
 * Count rows of the 'forum_access' table that match a condition.
 *
 * @param array $cond Condition passed straight to db_count().
 * @return mixed Whatever db_count() returns.
 */
function forum_access_count($cond = array())
{
    return db_count('forum_access', $cond);
}




?>  !empty($attach) and attach_big_insert($attach);

    

    $attachlist = $imagelist = $filelist = '';
    $images = 0;
    $files = 0;
    // 处理不在 message 中的图片，删除掉没有插入的附件
    if ($message) {
        // 只有评论会传pid
        list($attachlist, $imagelist, $filelist) = $pid ? well_attach_find_by_pid($pid) : well_attach_find_by_tid($tid);

        

        if (!empty($imagelist)) {
            $aids = array();
            foreach ($imagelist as $key => $attach) {

                $image_url = $conf['upload_url'] . 'website_attach/' . $attach['filename'];

                

                if (FALSE === strpos($message, $image_url)) {

                    unset($attachlist[$attach['aid']], $imagelist[$attach['aid']]);

                    $aids[] = $attach['aid'];

                    $path = $conf['upload_path'] . 'website_attach/' . $attach['filename'];
                    is_file($path) and unlink($path);

                    

                    // 删除云储存文件
                }

                
            }

            !empty($aids) and well_attach__delete($aids);

            
        }

        $images = count($imagelist);
        $files = count($filelist);

        
    }

    

    $return += array('tid' => $tid, 'pid' => $pid, 'icon' => $icon, 'message' => $message, 'images' => $images, 'files' => $files);

    

    return $return;
}

/**
 * Associate the files referenced in a piece of content with a thread or comment.
 * This function is being phased out; use well_attach_assoc_handle() instead.
 *
 * Steps visible in the body:
 *  1. When $arr['sess_tmp_files'] is non-empty: collect the <img src> values of the
 *     message, drop temporary images that are not referenced by the message, copy the
 *     remaining temporary files into upload/website_attach/<date dir>, rewrite their
 *     URLs inside the message, bulk-insert the attachment rows and clear
 *     $_SESSION['tmp_website_files'].
 *  2. When the message is non-empty: reload the stored attachments, delete image
 *     attachments whose URL no longer occurs in the message (file + DB row) and
 *     recompute the image/file counters.
 *  3. Persist changed counters through comment__update() / well_thread_update().
 *
 * Keys read from $arr: uid, tid, post_create, pid, images, files, message, sess_tmp_files.
 *
 * @param array $arr See the key list above.
 * @return string|array The (possibly rewritten) message. For a comment ($pid set) the
 *                      return value is array($message, $images, $files) when nothing
 *                      had to be updated or when the comment is being edited
 *                      ($post_create empty); in all other cases the message string.
 */
function well_attach_assoc_file($arr = array())
{
    global $conf, $time;

    $uid = array_value($arr, 'uid', 0);
    $tid = array_value($arr, 'tid', 0);
    $post_create = array_value($arr, 'post_create', 0); // a reply is being created
    $pid = array_value($arr, 'pid', 0);
    $images = array_value($arr, 'images', 0);
    $files = array_value($arr, 'files', 0);
    $message = array_value($arr, 'message');

    // Nothing to associate with: hand the message back untouched.
    if (!$tid && !$pid) return $message;

    // Target directory / URL prefix; the sub directory is derived from the
    // configured date() format (default 'Ym') applied to the request time.
    $attach_dir_save_rule = array_value($conf, 'attach_dir_save_rule', 'Ym');
    $day = date($attach_dir_save_rule, $time);
    $path = $conf['upload_path'] . 'website_attach/' . $day;
    $url = $conf['upload_url'] . 'website_attach/' . $day;
    is_dir($path) || mkdir($path, 0777, TRUE);

    if (!empty($arr['sess_tmp_files'])) {

        // NOTE(review): urldecode() rewrites the whole message (e.g. '+' becomes a
        // space), not just the image URLs - confirm this is intended.
        $message = urldecode($message);
        preg_match_all('#<img[^>]+src="(.*?)"#i', $message, $match);

        // URL prefixes that count as "this site"; matching images are skipped below.
        $localurlarr = array(
            'http://' . $_SERVER['SERVER_NAME'] . '/',
            'https://' . $_SERVER['SERVER_NAME'] . '/',
        );

        // Skip cloud storage URLs as well.
        $conf['cloud_url'] and $localurlarr[] = $conf['cloud_url'];

        /* Example of $match[1]:
            Array
            (
                [0] => https://nimg.ws.126.net/?url=http://dingyue.ws.126.net/2021/1109/d3321a58j00r29xq20013c000hk00h4g.jpg&thumbnail=650x2147483647&quality=80&type=jpg
                [1] => https://nimg.ws.126.net/?url=http://dingyue.ws.126.net/2021/1109/e4974b87j00r29xq30013c000fi00i3g.jpg&thumbnail=650x2147483647&quality=80&type=jpg
                [2] => upload/tmp/1_KAUXKFMJHFTUMNS.jpg
                [3] => https://nimg.ws.126.net/?url=http://dingyue.ws.126.net/2021/1109/5a7be552j00r29xq3001qc000hs00hvg.jpg&thumbnail=650x2147483647&quality=80&type=jpg
            )*/
        $upload_arr = array(); // temporary-upload URLs found in the message
        $http_arr = array(); // remote URLs found in the message (collected, not used further in this function)
        if (!empty($match[1])) {
            foreach ($match[1] as $_url) {

                // Ignore images already served from this site / the cloud URL.
                foreach ($localurlarr as $localurl) {
                    if ($localurl == substr($_url, 0, strlen($localurl))) continue 2;
                }

                if (substr($_url, 0, 7) == 'http://' || substr($_url, 0, 8) == 'https://') {
                    $http_arr[] = $_url;
                } elseif (substr($_url, 0, 11) == 'upload/tmp/' || substr($_url, 0, 12) == '/upload/tmp/' || substr($_url, 0, 14) == '../upload/tmp/') {
                    $upload_arr[] = $_url;
                }
            }
        }

        $attach = array();
        foreach ($arr['sess_tmp_files'] as $file) {

            // Drop images that are not used in the content; non-image attachments are kept.
            if (!in_array($file['url'], $upload_arr) && 0 != $file['isimage']) {
                unlink($file['path']);
                continue;
            }

            // Content submitted from the backstage needs its '../' prefix replaced.
            $file['url'] = $file['backstage'] ? str_replace('../upload/', 'upload/', $file['url']) : str_replace('/upload/', 'upload/', $file['url']);

            // Content attachment: the file is moved into the upload/website_attach directory.
            $filename = file_name($file['url']);

            // Absolute path
            $destfile = $path . '/' . $filename;
            // URL of the stored file (built from $conf['upload_url'])
            $desturl = $url . '/' . $filename;
            // Copy; a failure is only logged, processing continues.
            xn_copy($file['path'], $destfile) || xn_log("xn_copy($file[path]), $destfile) failed, tid:$tid, pid:$pid", 'php_error');

            // Remove the temporary file only when the copy exists with the same size.
            if (is_file($destfile) && filesize($destfile) == filesize($file['path'])) unlink($file['path']);

            // Idea noted by the author: upload $destfile to cloud storage or an image host
            // here and use the returned data. For attachment separation the preferred
            // design is a redis queue with a separate upload script run via nohup, which
            // uploads the queued data and then updates attach_on / image_url in the attach
            // table by aid and attach_on in the thread table by tid. Uploading while
            // associating attachments may cause timeouts.

            $attacharr = array(
                /*'tid' => $tid,
                'pid' => $pid,*/
                'uid' => $uid,
                'filesize' => $file['filesize'],
                'width' => $file['width'],
                'height' => $file['height'],
                'filename' => $day . '/' . $filename,
                'orgfilename' => $file['orgfilename'],
                //'image_url' => '', // full URL of the file on the image host
                'filetype' => $file['filetype'],
                'create_date' => $time,
                'isimage' => $file['isimage']
            );

            // Attach to the comment when $pid is given, otherwise to the thread.
            // NOTE(review): the whole statement is guarded by `$tid and`, so a call with
            // only $pid (and $tid == 0) stores neither id - confirm callers always pass tid.
            $tid and $attacharr += $pid ? array('pid' => $pid) : array('tid' => $tid);

            $attach[] = $attacharr;

            // Rows are inserted in bulk after the content has been associated.
            //$aid = well_attach_create($attach);

            // Point the message at the final location of the file.
            $file['backstage'] and $message = str_replace('../upload/', 'upload/', $message);
            $message = str_replace($file['url'], $desturl, $message);
        }

        !empty($attach) and attach_big_insert($attach);

        // Clear the session
        $_SESSION['tmp_website_files'] = array();
    }

    // Update the attachment counters
    $update = array();
    $_images = 0;
    $_files = 0;
    // Handle images that are not in the message: delete image attachments that were not inserted
    if ($message) {

        // Only comments pass a pid
        list($attachlist, $imagelist, $filelist) = $pid ? well_attach_find_by_pid($pid) : well_attach_find_by_tid($tid);

        if (!empty($imagelist)) {
            $aids = array();
            foreach ($imagelist as $key => $attach) {

                // $url and $path are reused here for the individual attachment.
                $url = $conf['upload_url'] . 'website_attach/' . $attach['filename'];

                if (FALSE === strpos($message, $url)) {
                    // presumably both lists are keyed by aid - verify against well_attach_find_by_*()
                    unset($attachlist[$attach['aid']], $imagelist[$attach['aid']]);

                    $aids[] = $attach['aid'];

                    $path = $conf['upload_path'] . 'website_attach/' . $attach['filename'];
                    is_file($path) and unlink($path);

                    // Delete the cloud storage file (not implemented here)
                }
            }

            !empty($aids) and well_attach__delete($aids);
        }

        // Record a counter only when it differs from the value passed in by the caller.
        // NOTE(review): count() requires arrays here - assumes the finder always returns arrays.
        $_images = count($imagelist);
        $images != $_images and $update['images'] = $_images;

        $_files = count($filelist);
        $files != $_files and $update['files'] = $_files;
    }

    // No counter changed: nothing to persist.
    if (empty($update)) return $pid ? array($message, $_images, $_files) : $message;

    if ($pid) {
        if ($post_create) {
            $update['message'] = $message;
            comment__update($pid, $update);
        } else {
            // Data returned when a reply is being edited
            return array($message, $_images, $_files);
        }
    } else {
        well_thread_update($tid, $update);
    }

    return $message;
}

/**
 * Fetch the temporary upload list kept in the session for an upload type.
 *
 * 'thumbnail' (main picture of a thread) maps to the 'tmp_thumbnail' session
 * entry, 'post' (images or attachments inside the content) maps to
 * 'tmp_website_files'. Any other type yields NULL.
 *
 * @param string $type 'thumbnail' or 'post'.
 * @return mixed Value returned by _SESSION() for the mapped key, or NULL for an unknown type.
 */
function well_attach_assoc_type($type)
{
    if ('thumbnail' == $type) {
        $session_key = 'tmp_thumbnail';
    } elseif ('post' == $type) {
        $session_key = 'tmp_website_files';
    } else {
        return NULL;
    }

    // A fallback that restored the list from the session data stored in the
    // database existed as commented-out code and remains disabled.
    return _SESSION($session_key);
}

/**
 * Create a thread thumbnail from the first temporary content upload.
 *
 * The thumbnail size comes from the forum's 'thumbnail' setting when present,
 * otherwise from $config['picture_size']. The fallback accepts both a nested
 * 'picture_size' entry (what the previous code read) and a plain
 * width/height array.
 *
 * Only the first entry of the session upload list is considered, and only
 * when it is an image. If it is not, nothing is rendered and the function
 * returns instead of copying a temporary file that was never written.
 *
 * @param array $arr Keys read: uid, tid, fid.
 * @return void
 */
function well_attach_create_thumbnail($arr)
{
    global $conf, $time, $forumlist, $config;

    $uid = array_value($arr, 'uid', 0);
    $tid = array_value($arr, 'tid', 0);
    $fid = array_value($arr, 'fid', 0);
    $forum = array_value($forumlist, $fid);

    // Resolve the target size: forum setting first, global config second.
    if (isset($forum['thumbnail'])) {
        $picture = $forum['thumbnail'];
    } else {
        $picture = $config['picture_size'];
        isset($picture['picture_size']) and $picture = $picture['picture_size'];
    }
    $pic_width = $picture['width'];
    $pic_height = $picture['height'];

    $attachlist = well_attach_assoc_type('post');
    if (empty($attachlist)) return;

    $attach_dir_save_rule = array_value($conf, 'attach_dir_save_rule', 'Ym');

    $day = date($attach_dir_save_rule, $time);
    $path = $conf['upload_path'] . 'thumbnail/' . $day;
    is_dir($path) || mkdir($path, 0777, TRUE);

    $basename = $uid . '_' . $tid . '_' . $time . '.jpeg';
    $tmp_file = $conf['upload_path'] . 'tmp/' . $basename;

    // Only the first uploaded entry is a thumbnail candidate.
    $rendered = FALSE;
    foreach ($attachlist as $val) {
        if (1 == $val['isimage']) {
            'clip' == array_value($conf, 'upload_resize', 'clip') ? well_image_clip_thumb($val['path'], $tmp_file, $pic_width, $pic_height) : well_image_thumb($val['path'], $tmp_file, $pic_width, $pic_height);
            $rendered = TRUE;
        }
        break;
    }

    // No image was rendered, so there is nothing to copy.
    if (!$rendered) return;

    $destfile = $path . '/' . $basename;
    xn_copy($tmp_file, $destfile) || xn_log("xn_copy($tmp_file), $destfile) failed, tid:$tid", 'php_error');
}

/**
 * Localise remote images referenced by a message.
 *
 * For every <img src="http..."> in the message that does not point at this site
 * (or the configured cloud URL) the image is probed with getimagesize(); GIF images
 * keep a .gif name, JPEG/PNG/WBMP/WEBP get a .jpeg name, other types are skipped.
 * Depending on the flags the image is downloaded into upload/website_attach/<date dir>,
 * an attachment row is created and the URL in the message is replaced; the first
 * processed image can additionally be turned into the thread thumbnail.
 *
 * Keys read from $arr: message, tid, fid, uid, thumbnail, save_image.
 *
 * NOTE(review): remote URLs taken from the message are fetched server-side
 * (getimagesize(), https_request()); if the message is user-supplied this deserves an
 * SSRF review - confirm against the callers.
 *
 * @param array $arr See the key list above.
 * @return string The message after URL replacement and attribute stripping.
 */
function well_save_remote_image($arr)
{
    global $conf, $time, $forumlist, $config;

    $message = array_value($arr, 'message');
    $tid = array_value($arr, 'tid', 0);
    $fid = array_value($arr, 'fid', 0);
    $uid = array_value($arr, 'uid', 0);
    $thumbnail = array_value($arr, 'thumbnail', 0);
    $save_image = array_value($arr, 'save_image', 0);

    // Target directory / URL prefix; sub directory from the configured date() format (default 'Ym').
    $attach_dir_save_rule = array_value($conf, 'attach_dir_save_rule', 'Ym');

    $day = date($attach_dir_save_rule, $time);
    $attach_dir = $conf['upload_path'] . 'website_attach/' . $day . '/';
    $attach_url = $conf['upload_url'] . 'website_attach/' . $day . '/';
    is_dir($attach_dir) || mkdir($attach_dir, 0777, TRUE);

    if ($thumbnail) {

        // Thumbnail size: forum 'thumbnail' setting if present, else the global config.
        // NOTE(review): the fallback reads $config['picture_size']['picture_size'] -
        // confirm the config really is nested like that.
        $picture = $config['picture_size'];
        $forum = array_value($forumlist, $fid);
        $picture = isset($forum['thumbnail']) ? $forum['thumbnail'] : $picture['picture_size'];
        $pic_width = $picture['width'];
        $pic_height = $picture['height'];

        $thumbnail_path = $conf['upload_path'] . 'thumbnail/' . $day . '/';
        is_dir($thumbnail_path) || mkdir($thumbnail_path, 0777, TRUE);

        // Despite its name this is the final thumbnail file inside the thumbnail directory.
        $tmp_file = $thumbnail_path . $uid . '_' . $tid . '_' . $time . '.jpeg';
    }

    // URL prefixes that count as "this site"; matching images are left alone.
    $localurlarr = array(
        'http://' . $_SERVER['SERVER_NAME'] . '/',
        'https://' . $_SERVER['SERVER_NAME'] . '/',
    );
    // Skip cloud storage URLs as well
    $conf['cloud_url'] and $localurlarr[] = $conf['cloud_url'];

    //$save_image_quality = array_value($conf, 'save_image_quality', 0);
    // Hard-coded to 0, so the GD re-encoding branch below is currently never taken.
    $save_image_quality = 0;

    // NOTE(review): urldecode() rewrites the whole message, not only the image URLs.
    $message = urldecode($message);
    //$message = str_replace('&amp;', '&', $message);
    //$message = htmlspecialchars_decode($message);
    preg_match_all('#<img[^>]+src="(http.*?)"#i', $message, $match);

    if (!empty($match[1])) {
        $n = 0; // number of attachment rows created
        $i = 0; // number of images seen by the thumbnail branch
        foreach ($match[1] as $url) {

            // Ignore images already served from this site / the cloud URL.
            foreach ($localurlarr as $localurl) {
                if ($localurl == substr($url, 0, strlen($localurl))) continue 2;
            }

            // Use the entity-decoded URL for fetching, and make the message use it too.
            $full_url = htmlspecialchars_decode($url);
            $message = str_replace($url, $full_url, $message);
            $getimgsize = getimagesize($full_url);
            if (FALSE === $getimgsize) continue; // not an image, skip

            // Index 2 of the getimagesize() result is the image type
            // (1 GIF, 2 JPG, 3 PNG, 15 WBMP, 18 WEBP - see the switch below).
            $filename = $uid . '_' . xn_rand(16);
            if (1 == $getimgsize[2]) {
                $filename .= '.gif';
                $destpath = $attach_dir . $filename;
            } elseif (in_array($getimgsize[2], array(2, 3, 15, 18))) {
                $filename .= '.jpeg';
                $destpath = $attach_dir . $filename;
            } else {
                continue; // uncommon image format, skip
            }

            // Candidate message with the remote URL replaced by the local one.
            $desturl = $attach_url . $filename;
            $_message = str_replace($full_url, $desturl, $message);

            if ($message != $_message) {

                if ($save_image) {
                    if (0 == $save_image_quality) {
                        // Store the downloaded bytes unchanged.
                        $imgdata = https_request($full_url);
                        //$destpath = $attach_dir . $filename;
                        file_put_contents_try($destpath, $imgdata);
                    } else {
                        // Image compression: GD is inefficient, ImageMagick needs an extra extension
                        switch ($getimgsize[2]) {
                            case 1: // GIF
                                $imgdata = imagecreatefromgif($full_url);
                                break;
                            case 2: // JPG
                                $imgdata = imagecreatefromjpeg($full_url);
                                break;
                            case 3: // PNG
                                $imgdata = imagecreatefrompng($full_url);
                                break;
                            case 15: // WBMP
                                $imgdata = imagecreatefromwbmp($full_url);
                                break;
                            case 18: // WEBP
                                $imgdata = imagecreatefromwebp($full_url);
                                break;
                        }
                        imagejpeg($imgdata, $destpath, $save_image_quality);
                        imagedestroy($imgdata);
                    }
                }

                // Create the thumbnail
                if ($thumbnail) {

                    // Only the first image reaching this point becomes the thumbnail.
                    if (1 == ++$i) {

                        // Images are not being kept: download this one just for the thumbnail.
                        if (empty($save_image)) {
                            $imgdata = https_request($full_url);
                            file_put_contents_try($destpath, $imgdata);
                        }

                        // Crop and save into the thumbnail directory
                        'clip' == array_value($conf, 'upload_resize', 'clip') ? well_image_clip_thumb($destpath, $tmp_file, $pic_width, $pic_height, $getimgsize) : well_image_thumb($destpath, $tmp_file, $pic_width, $pic_height, $getimgsize);
                        well_thread_update($tid, array('icon' => $time));
                    }

                    // Thumbnail-only mode: remove the download and keep the remote URL in the message.
                    if (empty($save_image)) {
                        is_file($destpath) and unlink($destpath);
                        continue;
                    }
                }

                // NOTE(review): $imgdata is only assigned in the $save_image branch or the
                // first-thumbnail branch above; with both flags empty it is not set in this
                // function before being read here, yet an attachment row is still created
                // and the URL replaced - confirm callers never pass both flags empty.
                $filesize = strlen($imgdata);
                $attach = array('tid' => $tid, 'uid' => $uid, 'filesize' => $filesize, 'width' => $getimgsize[0], 'height' => $getimgsize[1], 'filename' => "$day/$filename", 'orgfilename' => $filename, 'filetype' => 'image', 'create_date' => $time, 'downloads' => 0, 'isimage' => 1);
                $aid = well_attach_create($attach);
                $n++;
            }

            // Commit the replaced message and strip the listed attributes (class, data-*,
            // crossorigin, _width/_height, style, width, height) from it.
            $message = preg_replace('#(<img.*?)(class=.+?[\'|\"])|(data-src=.+?[\'|"])|(data-type=.+?[\'|"])|(data-ratio=.+?[\'|"])|(data-s=.+?[\'|"])|(data-fail=.+?[\'|"])|(crossorigin=.+?[\'|"])|((data-w)=[\'"]+[0-9]+[\'"]+)|(_width=.+?[\'|"]+)|(_height=.+?[\'|"]+)|(style=.+?[\'|"])|((width)=[\'"]+[0-9]+[\'"]+)|((height)=[\'"]+[0-9]+[\'"]+)#i', '$1', $_message);
        }

        // Add the number of newly stored images to the thread's image counter.
        $n and well_thread_update($tid, array('images+' => $n));
    }

    return $message;
}

/**
 * Cut a URL right after its image extension, dropping any trailing query
 * string or fragment.
 *
 * Extensions are tried in a fixed priority order (.jpg, .jpeg, .png, .gif,
 * .bmp); the first one found at a position greater than 0 wins. The match is
 * case-sensitive.
 *
 * The cut is done byte-wise: strpos() reports a byte offset, so combining it
 * with a character-based substring function would cut at the wrong place for
 * URLs that contain multibyte characters before the extension.
 *
 * @param string $url URL to trim.
 * @return string|null The URL up to and including the extension, or NULL when
 *                     no known extension is found.
 */
function well_get_image_url($url)
{
    $extensions = array('.jpg', '.jpeg', '.png', '.gif', '.bmp');

    foreach ($extensions as $ext) {
        $pos = strpos($url, $ext);
        // A match at offset 0 (or no match) is treated as "not found", as before.
        if ($pos) {
            return substr($url, 0, $pos + strlen($ext));
        }
    }

    return NULL;
}




?>     // 频道和全局置顶主题
        foreach ($arrlist as $val) {
            if (in_array($val['fid'], $fids) && 2 == $val['sticky']) {
                $sticky2[$val['tid']] = $val;
            } elseif (3 == $val['sticky']) {
                $sticky3[$val['tid']] = $val;
            }
        }
    } else {
        // 栏目/上级频道/全局置顶
        foreach ($arrlist as $val) {
            if ($forum['fid'] == $val['fid'] && 1 == $val['sticky']) {
                $sticky1[$val['tid']] = $val;
            } elseif (in_array($val['fid'], $fids) && 2 == $val['sticky']) {
                $sticky2[$val['tid']] = $val;
            } elseif (3 == $val['sticky']) {
                $sticky3[$val['tid']] = $val;
            }
        }
    }

    $sticky3 = empty($sticky3) ? array() : array_multisort_key($sticky3, 'create_date', FALSE, 'tid');
    $sticky2 = empty($sticky2) ? array() : array_multisort_key($sticky2, 'create_date', FALSE, 'tid');
    $sticky1 = empty($sticky1) ? array() : array_multisort_key($sticky1, 'create_date', FALSE, 'tid');

    $arr = $sticky3 + $sticky2 + $sticky1;

    

    return $arr;
}

/**
 * Return the list of all sticky threads, with caching.
 *
 * A static variable memoizes the list for the current request only; sharing
 * it across processes needs the external cache layer (redis / memcached /
 * xcache / apc). When the configured cache type is 'mysql' the list is read
 * straight from the database; otherwise the external cache is consulted first
 * and refilled for 1800 seconds on a miss.
 *
 * An empty result is stored as NULL, which isset() does not recognise, so an
 * empty list is looked up again on every call.
 *
 * @return array|null The sticky thread list, or NULL when there is none.
 */
function sticky_thread_find_cache()
{
    global $conf;
    static $cache = array();

    $key = 'sticky_thread_list';
    if (isset($cache[$key])) {
        return $cache[$key];
    }

    $db_only = ('mysql' == $conf['cache']['type']);

    // With an external cache, try it first; NULL signals a miss.
    $list = $db_only ? NULL : cache_get($key);

    if ($db_only || NULL === $list) {
        $list = sticky_thread__find(array(), array('tid' => -1), 1, 2000);
        if (!$db_only && $list) {
            cache_set($key, $list, 1800);
        }
    }

    $cache[$key] = $list ? $list : NULL;

    return $cache[$key];
}




?><!DOCTYPE html><html lang="zh-cn"><head><meta http-equiv="Content-Type" content="text/html; charset=utf-8" /><meta http-equiv="X-UA-Compatible" content="IE=Edge,chrome=1" /><meta http-equiv="Cache-Control" content="no-transform" /><meta http-equiv="Cache-Control" content="no-siteapp" /><meta name="viewport"
          content="width=device-width, initial-scale=1.0, minimum-scale=1.0, maximum-scale=1.0, user-scalable=no"><meta name="referrer" content="origin-when-cross-origin"><meta name="applicable-device" content="pc,mobile" /><meta name="MobileOptimized" content="width" /><meta name="HandheldFriendly" content="true" /><meta name="renderer" content="webkit" /><meta name="keywords" content="数据,处理,文本" /><meta name="description" content="mapreduce sequencefileinputformat使用" /><title>mapreduce sequencefileinputformat使用编程频道|福州电脑网
</title><link rel="shortcut icon" href="/view/img/favicon.ico" /><link rel="icon" sizes="32x32" href="/view/img/favicon.ico"><link rel="Bookmark" href="/view/img/favicon.ico" /><link rel="stylesheet" href="/view/template/mitiqin/css/style.css?2.3.0"><link rel="stylesheet" href="/view/template/mitiqin/css/iconfont.css?2.3.0"><script src="/view/template/mitiqin/js/jquery-2.2.4.min.js?2.3.0" type="text/javascript"></script></head><body><div id="header"><div class="header container"><div class="logo"><a href="/"  title="福州电脑网_福州电脑维修_福州电脑之家_福州iThome"><img src="/view/template/mitiqin/img/logo.png" alt="福州电脑网_福州电脑维修_福州电脑之家_福州iThome"></a></div><div id="monavber" class="nav" data-type="index" data-infoid><ul id="nav" class="navbar"><li class="navbar-item" data-active="fid-0"><a href="/">首页</a></li><li class="navbar-item" fid="5" data-active="fid-5"><a href="/biancheng">编程之家</a></li><li class="navbar-item" fid="4" data-active="fid-4"><a href="/xitong">系统教程</a></li><li class="navbar-item" fid="12" data-active="fid-12"><a href="/shuma">数码周边</a></li><li class="navbar-item" fid="13" data-active="fid-13"><a href="/pc">电脑</a></li></ul></div><div id="mnav"><i class="iconfont icon-app"></i></div><div id="search"><i class="iconfont icon-search"></i></div><div class="search"><form id="form-search" action="/operate/search.html"><input type="text" name="keyword" placeholder="关键词" value=""/><button type="submit" value="搜索"><i class="iconfont icon-search"></i></button><input type="hidden" name="range" value="1"></form></div></div></div>
<div class="fzithome-com breadcrumb2 container-w"><div id="b" class="cl"><div class="fzithome-com fl"><i class="iconfont icon-home"></i><a href="/">首页</a>&nbsp;>&nbsp;
<a href="/xitong">系统教程</a><a href="/xitong/1708962415a282412.html" title="首页">mapreduce sequencefileinputformat使用</a></div></div></div><div class="fzithome-com main container-w cl"><div class="fzithome-com mainl"><div class="fzithome-com art-post"><div class="fzithome-com title"><h1>mapreduce sequencefileinputformat使用</h1><div class="fzithome-com info"><span><a href="/xitong"><i class="iconfont icon-crossborder-fill"></i>系统教程</a></span><span><i class="iconfont icon-browse"></i>91</span><span><i class="iconfont icon-message-fill"></i>0</span><span>
                        更新时间：2026-04-06 12:46:09</span></div></div><div class="fzithome-com art-content"><article class="single-post"><div class="fzithome-com entry"><p>2024年2月26日发(作者：)</p><p><h2></h2></p><p></img></p><p style="text-indent: 2em;";></p><p style="text-indent: 2em;";>mapreduce sequencefileinputformat使用 </p><p style="text-indent: 2em;";>【实用版】 </p><p style="text-indent: 2em;";>目录 </p><p style="text-indent: 2em;";>1.MapReduce 概述   </p><p style="text-indent: 2em;";>2.SequenceFile 概述   </p><p style="text-indent: 2em;";>3.MapReduce SequenceFileInputFormat 的使用方法   </p><p style="text-indent: 2em;";>4.实际应用示例 </p><p style="text-indent: 2em;";>正文 </p><p style="text-indent: 2em;";>一、MapReduce 概述   </p><p style="text-indent: 2em;";>MapReduce 是一种编程模型，用于大规模数据处理。它包含两个操作：Map 和 Reduce。Map 操作对输入数据进行切分和处理，将数据分为多个片段。Reduce 操作对 Map 操作产生的数据进行整合和处理，最终生成输出结果。MapReduce 广泛应用于分布式计算环境中，如 Hadoop。 </p><p style="text-indent: 2em;";>二、SequenceFile 概述   </p><p style="text-indent: 2em;";>SequenceFile 是一种二进制文件格式，用于存储大规模数据。它由多个数据块组成，每个数据块包含一个记录。SequenceFile 支持多种数据类型，如文本、整数、浮点数等。SequenceFile 在 Hadoop 生态系统中被广泛使用，因为它具有高效的读写性能和便于存储和传输的特点。 </p><p style="text-indent: 2em;";>三、MapReduce SequenceFileInputFormat 的使用方法   </p><p style="text-indent: 2em;";>MapReduce SequenceFileInputFormat 是 Hadoop 提供的一个类，用于处理 SequenceFile 格式的输入数据。它继承自 InputFormat 接口，并实现了对 SequenceFile 的读取功能。使用 MapReduce </p><p style="text-indent: 2em;";>SequenceFileInputFormat 的方法如下： </p><p style="text-indent: 2em;";>1.创建一个实现 InputFormat 接口的类，如 MyInputFormat。   </p><p style="text-indent: 2em;";> </p><p style="text-indent: 2em;";>第 1 页 共 2 页 </p><p style="text-indent: 2em;";>2.在 MyInputFormat 类中，实现 InputFormat 接口的 getInput </p><p style="text-indent: 2em;";>方法，返回一个 SequenceFile 路径。   </p><p style="text-indent: 2em;";>3.在 MyInputFormat 类中，实现 InputFormat 接口的 </p><p style="text-indent: 2em;";>getRecordReader 方法，返回一个 SequenceFileRecordReader 对象。   </p><p style="text-indent: 2em;";>4.在 MyInputFormat 类中，实现 InputFormat 接口的 getSplit </p><p style="text-indent: 
2em;";>方法，返回一个 SequenceFileSplit 对象。   </p><p style="text-indent: 2em;";>5.在 MyInputFormat 类中，实现 InputFormat 接口的 </p><p style="text-indent: 2em;";>isSplitable 方法，返回 true，使 SequenceFile 支持切分。 </p><p style="text-indent: 2em;";>四、实际应用示例   </p><p style="text-indent: 2em;";>假设我们有一个处理文本数据的任务，需要对文本数据进行分词处理。我们可以使用 MapReduce SequenceFileInputFormat 来完成这个任务。具体步骤如下： </p><p style="text-indent: 2em;";>1.创建一个名为 MyInputFormat 的类，实现 InputFormat 接口的 </p><p style="text-indent: 2em;";>getInput、getRecordReader、getSplit 和 isSplitable 方法。   </p><p style="text-indent: 2em;";>2.在 MyInputFormat 类中，实现对 SequenceFile 的读取功能，将文本数据切分为单词。   </p><p style="text-indent: 2em;";>3.创建一个名为 MyMapper 的类，继承自 Mapper 接口，实现 map </p><p style="text-indent: 2em;";>方法，对文本数据进行分词处理。   </p><p style="text-indent: 2em;";>4.创建一个名为 MyReducer 的类，继承自 Reducer 接口，实现 </p><p style="text-indent: 2em;";>reduce 方法，对分词后的数据进行整合。   </p><p style="text-indent: 2em;";>5.在 Hadoop 中提交任务，使用 MyInputFormat、MyMapper 和 </p><p style="text-indent: 2em;";>MyReducer 类，并将输出结果写入 HDFS。 </p><p style="text-indent: 2em;";> </p><p style="text-indent: 2em;";> </p><p style="text-indent: 2em;";>第 2 页 共 2 页 </p><p><p><h2></h2></p></img></p></div></article></div><div class="fzithome-com info"><div><span>本文发布于:2024-02-26，感谢您对本站的认可！</span></div><div><span>本文链接:</span><a href="https://www.fzithome.com/xitong/1708962415a282412.html" title="mapreduce sequencefileinputformat使用">https://www.fzithome.com/xitong/1708962415a282412.html</a></div><div><span>版权声明:本站内容均来自互联网，仅供演示用，请勿用于商业和其他非法用途。如果侵犯了您的权益请与我们联系，我们将在24小时内删除。</span></div></div><span class="tag"><i class="iconfont icon-discount" style="font-size:12px;font-weight:bold;opacity:.7;">本文标签：</i><a href="/tag/235.html" target="_blank">数据</a><a href="/tag/449.html" target="_blank">处理</a><a href="/tag/597.html" target="_blank">文本</a></span></div><div class="fzithome-com post_comments" id="comments"><div id="comt-respond" class="commentpost"><h4>发布评论
<span><a rel="nofollow" id="cancel-reply" href="#comment" style="display:none;"><small>取消回复</small></a></span></h4><form action="/comment/create/282412.html?safe_token=PAYLvr8VHc4OHiSaOKzY7VdVb8f9Sw6iqNmIig5WW_2FQZwBUY6P_2BiER2wtrxHdlaUCDFU7zpI7XWJa76SMdwU6A_3D_3D" method="post" name="saypl" id="frmSumbit"><input type="hidden" name="doctype" value="1" /><input type="hidden" name="quotepid" value="0" /><div id="comment-tools"><div class="fzithome-com tools_text"><textarea placeholder="请在这里留言..." name="message" id="txaArticle" class="text input-block-level comt-area" cols="50" rows="4" tabindex="5"></textarea></div></div><div class="fzithome-com psumbit"><input name="sumbit" type="submit" tabindex="6" value="发布" class="button" /></div></form></div><div class="fzithome-com commentlist"><div class="fzithome-com comment-tab"><div class="fzithome-com come-comt">评论列表<span id="comment_count">（有<span id="infocommentnumarea" style="color:#c81111">0</span>条评论）</span></div></div><ul class="diy-comment"></ul></div></div></div><div class="fzithome-com mainr"><div class="widget widget_previous"><h4 class="bar">最近发表</h4><ul><li><a href="/xitong/1700736940a5.html"title='打开mdb数据库_PyTorch60.读写LMDB数据库' aria-label='打开mdb数据库_PyTorch60.读写LMDB数据库'>打开mdb数据库_PyTorch60.读写LMDB数据库</a></li><li><a href="/xitong/1700737632a39.html"title='mdb文件取消隐藏_如何关闭Windows10系统盘中的休眠文件可以节省空间' aria-label='mdb文件取消隐藏_如何关闭Windows10系统盘中的休眠文件可以节省空间'>mdb文件取消隐藏_如何关闭Windows10系统盘中的休眠文件可以节省空间</a></li><li><a href="/xitong/1700738253a67.html"title='DVE用户手册' aria-label='DVE用户手册'>DVE用户手册</a></li><li><a href="/xitong/1700739575a124.html"title='VB程序中用ADO对象动态创建数据库和表' aria-label='VB程序中用ADO对象动态创建数据库和表'>VB程序中用ADO对象动态创建数据库和表</a></li><li><a href="/xitong/1700741804a224.html"title='高中信息技术会考数据库模块操作题题库' aria-label='高中信息技术会考数据库模块操作题题库'>高中信息技术会考数据库模块操作题题库</a></li><li><a href="/xitong/1700742603a259.html"title='高中信息技术学考ACCESS操作题练习' aria-label='高中信息技术学考ACCESS操作题练习'>高中信息技术学考ACCESS操作题练习</a></li><li><a 
href="/xitong/1700752349a732.html"title='中国第一部特许经营法规引发热点关注' aria-label='中国第一部特许经营法规引发热点关注'>中国第一部特许经营法规引发热点关注</a></li><li><a href="/xitong/1700753098a771.html"title='网络新闻' aria-label='网络新闻'>网络新闻</a></li><li><a href="/xitong/1700759581a1082.html"title='惠普电脑一键还原备份的方法步骤' aria-label='惠普电脑一键还原备份的方法步骤'>惠普电脑一键还原备份的方法步骤</a></li><li><a href="/xitong/1700759669a1087.html"title='一键还原的使用' aria-label='一键还原的使用'>一键还原的使用</a></li><li><a href="/xitong/1700759910a1100.html"title='一键还原系统操作说明maxdos迈思' aria-label='一键还原系统操作说明maxdos迈思'>一键还原系统操作说明maxdos迈思</a></li><li><a href="/xitong/1700760281a1120.html"title='手机ADB备份及RECOVERY下备份' aria-label='手机ADB备份及RECOVERY下备份'>手机ADB备份及RECOVERY下备份</a></li><li><a href="/xitong/1700760334a1123.html"title='一键Ghost' aria-label='一键Ghost'>一键Ghost</a></li><li><a href="/xitong/1700761088a1164.html"title='还很浪费时间 今天我把如何安装系统知识做一解释 希望大家能够学_百' aria-label='还很浪费时间 今天我把如何安装系统知识做一解释 希望大家能够学_百'>还很浪费时间 今天我把如何安装系统知识做一解释 希望大家能够学_百</a></li><li><a href="/xitong/1700761471a1184.html"title='操作系统重新安装和一键还原软件使用图解说明' aria-label='操作系统重新安装和一键还原软件使用图解说明'>操作系统重新安装和一键还原软件使用图解说明</a></li><li><a href="/xitong/1700764048a1326.html"title='解决电脑风扇转速过快的问题' aria-label='解决电脑风扇转速过快的问题'>解决电脑风扇转速过快的问题</a></li><li><a href="/xitong/1700764603a1358.html"title='最新CPU智能风扇转速控制Smart' aria-label='最新CPU智能风扇转速控制Smart'>最新CPU智能风扇转速控制Smart</a></li><li><a href="/xitong/1700766685a1476.html"title='华硕电脑经常自动重启怎么回事' aria-label='华硕电脑经常自动重启怎么回事'>华硕电脑经常自动重启怎么回事</a></li><li><a href="/xitong/1700768206a1562.html"title='风扇调速电阻利弊分析' aria-label='风扇调速电阻利弊分析'>风扇调速电阻利弊分析</a></li><li><a href="/xitong/1700768513a1580.html"title='风扇调速电路原理' aria-label='风扇调速电路原理'>风扇调速电路原理</a></li></ul></div><section id="aside_about" class="widget widget_aside_about sb br mb"><div class="avatar"><img class="img" src="/view/template/mitiqin/img/tx.jpg"
             alt="福州电脑网_福州电脑维修_福州电脑之家_福州iThome"/></div><div class="wrap pd"><p class="title">福州电脑网_福州电脑维修_福州电脑之家_福州iThome</p><p class="info">福州电脑维修网(fzithome.com)专业的电脑维修,笔记本维修,上门维修各种电脑,笔记本,平板等,快速上门.电脑知识频道内容覆盖:计算机资讯,电脑基础应用知识,各种电脑故障维修学习,电脑外设产品维修维护,病毒，软件,硬件,常识.</p><ul class="ul clearfix"></ul></div></section><div class="fzithome-com clear"></div><div class="fzithome-com widgets"><h4 class="bar">相关推荐</h4><div class="fzithome-com hot-post"><ul class="clearfix"><li><a href="/xitong/1771567676a2687742.html"title='拯救RAW：深度解析文件系统转变与修复技术' aria-label='拯救RAW：深度解析文件系统转变与修复技术'><span class="sptit">拯救RAW：深度解析文件系统转变与修复技术</span></a></li><li><a href="/xitong/1771673054a2688920.html"title='掌握Adobe Flash Player，给重要资料加层神秘面纱——文件夹加密大法' aria-label='掌握Adobe Flash Player，给重要资料加层神秘面纱——文件夹加密大法'><span class="sptit">掌握Adobe Flash Player，给重要资料加层神秘面纱——文件夹加密大法</span></a></li><li><a href="/xitong/1771806457a2690419.html"title='从物理层到应用层：PCI技术在嵌入式系统中的奇妙旅程' aria-label='从物理层到应用层：PCI技术在嵌入式系统中的奇妙旅程'><span class="sptit">从物理层到应用层：PCI技术在嵌入式系统中的奇妙旅程</span></a></li><li><a href="/biancheng/1771807457a2690429.html"title='轻松实现！iPad mini2的10.3.3版本刷机降级教程' aria-label='轻松实现！iPad mini2的10.3.3版本刷机降级教程'><span class="sptit">轻松实现！iPad mini2的10.3.3版本刷机降级教程</span></a></li><li><a href="/xitong/1771859003a2691007.html"title='游戏、视频流畅度大升级：如何选择开启或不开启CPU访问显存加速？' aria-label='游戏、视频流畅度大升级：如何选择开启或不开启CPU访问显存加速？'><span class="sptit">游戏、视频流畅度大升级：如何选择开启或不开启CPU访问显存加速？</span></a></li><li><a href="/biancheng/1771987623a2691496.html"title='打造疾速SSD：从4K对齐开始' aria-label='打造疾速SSD：从4K对齐开始'><span class="sptit">打造疾速SSD：从4K对齐开始</span></a></li><li><a href="/xitong/1772001437a2691648.html"title='回收站清理了还有一线希望吗？10天内被干掉的文件别放弃！' aria-label='回收站清理了还有一线希望吗？10天内被干掉的文件别放弃！'><span class="sptit">回收站清理了还有一线希望吗？10天内被干掉的文件别放弃！</span></a></li><li><a href="/biancheng/1772042222a2692111.html"title='深入浅出：Hex文件解析与Bin文件互换秘籍' aria-label='深入浅出：Hex文件解析与Bin文件互换秘籍'><span class="sptit">深入浅出：Hex文件解析与Bin文件互换秘籍</span></a></li><li><a 
href="/biancheng/1772129472a2693107.html"title='动手实践：掌握Python里temp变量背后的奥秘' aria-label='动手实践：掌握Python里temp变量背后的奥秘'><span class="sptit">动手实践：掌握Python里temp变量背后的奥秘</span></a></li><li><a href="/xitong/1772305016a2695082.html"title='数据库大神必学：一主两从模式下的MySQL高可用策略' aria-label='数据库大神必学：一主两从模式下的MySQL高可用策略'><span class="sptit">数据库大神必学：一主两从模式下的MySQL高可用策略</span></a></li><li><a href="/biancheng/1772414575a2696321.html"title='NRG文件挑战解码：完整步骤解析与实操方法' aria-label='NRG文件挑战解码：完整步骤解析与实操方法'><span class="sptit">NRG文件挑战解码：完整步骤解析与实操方法</span></a></li><li><a href="/xitong/1772425423a2696440.html"title='Excel小白必看：XlFileFormat与文件扩展名_excel的完美配对指南' aria-label='Excel小白必看：XlFileFormat与文件扩展名_excel的完美配对指南'><span class="sptit">Excel小白必看：XlFileFormat与文件扩展名_excel的完美配对指南</span></a></li><li><a href="/biancheng/1772473790a2696965.html"title='深度解析：在Web开发领域，Document.execCommand和Clipboard API的异同在哪里？' aria-label='深度解析：在Web开发领域，Document.execCommand和Clipboard API的异同在哪里？'><span class="sptit">深度解析：在Web开发领域，Document.execCommand和Clipboard API的异同在哪里？</span></a></li><li><a href="/xitong/1772474480a2696974.html"title='轻松搞定：Windows剪贴板与clipbrd工具的全方位攻略，帮你快速提升工作效率！' aria-label='轻松搞定：Windows剪贴板与clipbrd工具的全方位攻略，帮你快速提升工作效率！'><span class="sptit">轻松搞定：Windows剪贴板与clipbrd工具的全方位攻略，帮你快速提升工作效率！</span></a></li><li><a href="/xitong/1773420890a2701110.html"title='不再担心数据丢失，SayRecy帮你找回被遗忘的电脑文件！' aria-label='不再担心数据丢失，SayRecy帮你找回被遗忘的电脑文件！'><span class="sptit">不再担心数据丢失，SayRecy帮你找回被遗忘的电脑文件！</span></a></li><li><a href="/xitong/1773549790a2702540.html"title='一步到位：Mac用户轻松清理Apple缓存，提升性能！' aria-label='一步到位：Mac用户轻松清理Apple缓存，提升性能！'><span class="sptit">一步到位：Mac用户轻松清理Apple缓存，提升性能！</span></a></li><li><a href="/biancheng/1773559479a2702643.html"title='从Canon CR2到IFD0：探索RAW图片格式的内部构造' aria-label='从Canon CR2到IFD0：探索RAW图片格式的内部构造'><span class="sptit">从Canon CR2到IFD0：探索RAW图片格式的内部构造</span></a></li><li><a href="/biancheng/1773592815a2703029.html"title='厂里资讯热点：聚焦Flash技术，深度解析Adobe Flash Player的最新趋势' aria-label='厂里资讯热点：聚焦Flash技术，深度解析Adobe Flash Player的最新趋势'><span 
class="sptit">厂里资讯热点：聚焦Flash技术，深度解析Adobe Flash Player的最新趋势</span></a></li><li><a href="/xitong/1773603864a2703153.html"title='硬盘性能比较指南，助你做出明智选择' aria-label='硬盘性能比较指南，助你做出明智选择'><span class="sptit">硬盘性能比较指南，助你做出明智选择</span></a></li><li><a href="/biancheng/1773605093a2703157.html"title='SWF硬盘谁最强？全面比较与解析' aria-label='SWF硬盘谁最强？全面比较与解析'><span class="sptit">SWF硬盘谁最强？全面比较与解析</span></a></li></ul></div></div><div class="fzithome-com clear"></div><div class="widget widget_tags"><h4 class="bar">标签列表</h4><ul><li class="submenu"><a target="_blank" href="/tag/245239.html">电压监视</a></li><li class="submenu"><a target="_blank" href="/tag/245201.html">跟着指南</a></li><li class="submenu"><a target="_blank" href="/tag/245160.html">被加载到</a></li><li class="submenu"><a target="_blank" href="/tag/245023.html">系统中让</a></li><li class="submenu"><a target="_blank" href="/tag/245018.html">骤让你网</a></li><li class="submenu"><a target="_blank" href="/tag/245009.html">被强制下</a></li><li class="submenu"><a target="_blank" href="/tag/245002.html">地址的位</a></li><li class="submenu"><a target="_blank" href="/tag/244968.html">全面系统</a></li><li class="submenu"><a target="_blank" href="/tag/244948.html">函数功能</a></li><li class="submenu"><a target="_blank" href="/tag/244913.html">新建磁盘</a></li><li class="submenu"><a target="_blank" href="/tag/244866.html">恢复方案</a></li><li class="submenu"><a target="_blank" href="/tag/244856.html">目录是否</a></li><li class="submenu"><a target="_blank" href="/tag/244849.html">停电后的</a></li><li class="submenu"><a target="_blank" href="/tag/244845.html">修复照片</a></li><li class="submenu"><a target="_blank" href="/tag/244813.html">盘问题</a></li><li class="submenu"><a target="_blank" href="/tag/244810.html">功能窗口</a></li><li class="submenu"><a target="_blank" href="/tag/244808.html">自己做个</a></li><li class="submenu"><a target="_blank" href="/tag/244773.html">件下载功</a></li><li class="submenu"><a target="_blank" href="/tag/244762.html">耳机插在</a></li><li class="submenu"><a target="_blank" 
href="/tag/244761.html">也检测不</a></li></ul></div><div class="fzithome-com clear"></div></div></div><footer id="footer"><div class="footer container-w cl"><div class="fnav"></div><span class="copy">

            CopyRight © 2022 All Rights Reserved

            <a href="/" title="福州电脑网_福州电脑维修_福州电脑之家_福州iThome" target="_blank">福州电脑网_福州电脑维修_福州电脑之家_福州iThome</a></span>
        备案号：<a target="_blank" rel="nofollow" href="https://beian.miit.gov.cn/" style="font-size: 12px;">豫ICP备2022026798号-13</a></div></footer><script src="/view/template/mitiqin/js/common.min.js?2.3.0"></script><script src="/view/js/xiuno.js"></script><script src="/view/template/mitiqin/js/app.js?2.3.0"></script><div id="gotop"><div style="display: none; margin-bottom:5px;" id="goTopBtn"><a title="返回顶部" class="gotopa"><span class="iconfont icon-rocket-fill"></span></a></div></div></body></html>