hadoop大数据入门 - wtdig/study GitHub Wiki
1)hadoop数据的关注点:大数据的存储;并行计算模型====》分布式文件系统:HDFS;并行计算模型:mapreduce
2)hadoop的组成部分:commom模块,hdfs模块,mapreduce模块,yarn模块(调度功能)
3)hadoop有三种配置方式:1、本地模式;2、伪分布式;3、完全分布式
4)本地模式使用的文件系统是:本机的文件系统;伪分布式使用的文件系统:单一节点的hdfs文件系统;完全分布式使用的文件系统是:多个节点的hdfs文件系统
5)hdfs的高可用性,采取的方式是,一个文件会存储成三份副本,保证数据不丢失
6)hdfs的文件路径是虚拟的文件路径,具体的存储路径是根据实际存储在服务器节点的物理机的磁盘上
7)hadoop启动后的进程为5个进程:1、nameNode 名称节点 2、dataNode 数据节点 3、Secondary NameNode 辅助名称节点 4、ResourceManage 资源管理器 5、NodeManager 节点管理器
8)一般,情况下,hadoop进行集群时,将一台服务器作为名称节点(相当于一个目录),另一个不一样的服务器作为JObTracer(调度),前两台都是master,后面的机器作为数据节点,作为slave.
wget http://mirror.bit.edu.cn/apache/hadoop/common/hadoop-2.7.7/hadoop-2.7.7.tar.gz
tar -zxvf hadoop-2.7.7.tar.gz -C /usr/wt/hadoop/
/usr/wt/hadoop/hadoop-2.7.7/etc/hadoop
在etc/profile文件夹下,配置
# hadoop
export HADOOP_HOME=/usr/wt/hadoop/hadoop-2.7.7
export PATH=$PATH:$HADOOP_HOME/bin:$HADOOP_HOME/sbin
source /etc/profile 使其生效
core-site.xml
指定hdfs的路径、hadoop初始化的名称节点的位置
<property>
<name>fs.defaultFS</name>
<value>hdfs://localhost:9000</value>
</property>
<property>
<name>hadoop.tmp.dir</name>
<value>/var/tmp/hadoop/hadoop-${user.name}</value>
</property>
hdfs-site.xml
配置备份数为1
<property>
<name>dfs.replication</name>
<value>1</value>
</property>
yarn-site.xml
指定使用的mapreduce
<property>
<name>yarn.nodemanager.aux-services</name>
<value>mapreduce_shuffle</value>
</property>
复制一个mapred-site.xml文件、配置指定的调度yarn
copy mapred-site.xml.template mapred-site.xml
<property>
<name>mapreduce.framework.name</name>
<value>yarn</value>
</property>
修改hadoop运行时的jdk
hadoop-env.sh
export JAVA_HOME=/usr/wt/java/jdk1.8.0_171
ssh localhost
看是否需要密码,如果需要,使用如下命令
ssh-keygen -t rsa -P '' -f ~/.ssh/id_rsa
cat ~/.ssh/id_rsa.pub >> ~/.ssh/authorized_keys
chmod 0600 ~/.ssh/authorized_keys
在次使用ssh localhost,看是否可以无需密码登陆
hdfs namenode -format
start-all.sh
jps
2098 DataNode
2754 NodeManager
2293 SecondaryNameNode
2461 ResourceManager
50846 Jps
1951 NameNode
如果NameNode没有启动,在hadoop的logs中查看hadoop-root-namenode-hadoop0.log
如果错误是:org.apache.hadoop.hdfs.server.common.InconsistentFSStateException: Directory /tmp/hadoop-root/dfs/name is in an inconsistent state: storage directory does not exist or is not accessible.
在core-site.xml中加入
hadoop.tmp.dir /var/tmp/hadoop/hadoop-${user.name}https://archive.apache.org/dist/hadoop/common/hadoop-2.7.2/hadoop-2.7.2.tar.gz
解压到指定文件
配置环境变量:
HADOOP_HOME=D:\hadoop\hadoop-2.7.2
path:%HADOOP_HOME%\bin
下载window中需要的文件:
下载bin里面的文件:https://github.com/srccodes/hadoop-common-2.2.0-bin
将bin中的文件复制到hadoop的bin下
编写代码
package com.hadoop.tempearture;
/**
* mapper函数
*/
import org.apache.hadoop.io.IntWritable;
import org.apache.hadoop.io.LongWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.mapreduce.Mapper;
import java.io.IOException;
public class MaxTemperatureMapper extends Mapper<LongWritable, Text, Text, IntWritable> {
//注1
private static final int MISSING = 9999;
@Override
public void map(LongWritable key, Text value, Context context) throws IOException, InterruptedException {
String line = value.toString();
//获取年份
String year = line.substring(15, 19);
//获取气温的正负值
int airTemperature;
if (line.charAt(87) == '+') {
// parseInt doesn't like leading plus signs
airTemperature = Integer.parseInt(line.substring(88, 92));
} else {
airTemperature = Integer.parseInt(line.substring(87, 92));
}
//获取气温的质量参数
String quality = line.substring(92, 93);
//筛选异常的数据
if (airTemperature != MISSING && quality.matches("[01459]")) {
context.write(new Text(year), new IntWritable(airTemperature));
}
}
}
package com.hadoop.tempearture;
/**
* reduce函数
*/
import org.apache.hadoop.io.IntWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.mapreduce.Reducer;
import java.io.IOException;
public class MaxTemperatureReducer extends Reducer<Text, IntWritable, Text, IntWritable> {
@Override
public void reduce(Text key, Iterable<IntWritable> values, Context context)
throws IOException, InterruptedException {
int maxValue = Integer.MIN_VALUE;
//获取每个年份最大的气温值
for (IntWritable value : values) {
maxValue = Math.max(maxValue, value.get());
}
context.write(key, new IntWritable(maxValue));
}
}
package com.hadoop.tempearture;
/**
* 本mr主要功能,根据原始的气温信息,计算每年的最大气温
* <br>
* <span>map阶段:读取指定路径的输入文本,将每行记录作为一个value,偏移量作为key,通过筛选,将年份作为key,气温值作为value,输出到reduce中</span>
* <span>reduce阶段:map阶段输出的key,value,在reduce阶段进行聚合,年份依旧作为key,将相同年份的最大气温输出作为value,输出到指定的输出文件中</span>
* </br>
*/
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.IntWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.mapreduce.Job;
import org.apache.hadoop.mapreduce.lib.input.FileInputFormat;
import org.apache.hadoop.mapreduce.lib.output.FileOutputFormat;
public class MaxTemperature {
public static void main(String[] args) throws Exception {
if (args.length != 2) {
System.err.println("Usage: MaxTemperature <input path> <output path>");
System.exit(-1);
}
//创建一个job实例
Job job = Job.getInstance();
//设置调度的主函数
job.setJarByClass(MaxTemperature.class);
job.setJobName("Max temperature");
//设置输入和输出
FileInputFormat.addInputPath(job, new Path(args[0]));
FileOutputFormat.setOutputPath(job, new Path(args[1]));
//设置map函数
job.setMapperClass(MaxTemperatureMapper.class);
//设置reduce函数
job.setReducerClass(MaxTemperatureReducer.class);
//设置输出的key类型
job.setOutputKeyClass(Text.class);
//设置输出的value类型
job.setOutputValueClass(IntWritable.class);
//执行job任务
System.exit(job.waitForCompletion(true) ? 0 : 1);
}
}
配置参数:
Program arguments
D:/alibababank/hadoop/maxtep/input
D:/alibababank/hadoop/maxtep/output
Main class
com.hadoop.tempearture.MaxTemperature
output文件夹不需要建立,每次执行完都需要删除该目录;
其中input文件夹需要提前新建;里面放入输入数据:
simple.txt
0067011990999992016051507004+68750+023550FM-12+038299999V0203301N00671220001CN9999999N9+00001+99999999999
0043011990999992016051512004+68750+023550FM-12+038299999V0203201N00671220001CN9999999N9+07771+99999999999
0043011990999992016051518004+68750+023550FM-12+038299999V0203201N00261220001CN9999999N9-07771+99999999999
0043012650999992017032412004+62300+010750FM-12+048599999V0202701N00461220001CN0500001N9+08881+99999999999
0043012650999992017032418004+62300+010750FM-12+048599999V0202701N00461220001CN0500001N9+00781+99999999999
0043012650999992018032418004+62300+010750FM-12+048599999V0202701N00461220001CN0500001N9+09991+99999999999
0043012650999992018032418004+62300+010750FM-12+048599999V0202701N00461220001CN0500001N9+00011+99999999999
使用配置的参数,运行主函数:
如果发现缺少window的文件,重启电脑后,再次执行;
如果hadoop in thread "main" java.lang.UnsatisfiedLinkError: org.apache.hadoop.io.nativeio.NativeIO$Windows.access0(Ljava/lang/String;I)Z
那么在src下新建org.apache.hadoop.io.nativeio包,里面放入一下代码
主要是修改:永远返回 true
public static boolean access(String path, NativeIO.Windows.AccessRight desiredAccess) throws IOException {
//return access0(path, desiredAccess.accessRight());
return true;
}
修改后的代码
//
// Source code recreated from a .class file by IntelliJ IDEA
// (powered by Fernflower decompiler)
//
package org.apache.hadoop.io.nativeio;
import com.google.common.annotations.VisibleForTesting;
import java.io.Closeable;
import java.io.File;
import java.io.FileDescriptor;
import java.io.FileInputStream;
import java.io.FileOutputStream;
import java.io.IOException;
import java.io.RandomAccessFile;
import java.lang.reflect.Field;
import java.nio.ByteBuffer;
import java.nio.MappedByteBuffer;
import java.nio.channels.FileChannel;
import java.util.Map;
import java.util.concurrent.ConcurrentHashMap;
import org.apache.commons.logging.Log;
import org.apache.commons.logging.LogFactory;
import org.apache.hadoop.classification.InterfaceAudience.Private;
import org.apache.hadoop.classification.InterfaceStability.Unstable;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.HardLink;
import org.apache.hadoop.io.IOUtils;
import org.apache.hadoop.io.SecureIOUtils.AlreadyExistsException;
import org.apache.hadoop.util.NativeCodeLoader;
import org.apache.hadoop.util.PerformanceAdvisory;
import org.apache.hadoop.util.Shell;
import sun.misc.Cleaner;
import sun.misc.Unsafe;
import sun.nio.ch.DirectBuffer;
@Private
@Unstable
public class NativeIO {
private static boolean workaroundNonThreadSafePasswdCalls = false;
private static final Log LOG = LogFactory.getLog(NativeIO.class);
private static boolean nativeLoaded = false;
private static final Map<Long, NativeIO.CachedUid> uidCache;
private static long cacheTimeout;
private static boolean initialized;
public NativeIO() {
}
public static boolean isAvailable() {
return NativeCodeLoader.isNativeCodeLoaded() && nativeLoaded;
}
private static native void initNative();
static long getMemlockLimit() {
return isAvailable() ? getMemlockLimit0() : 0L;
}
private static native long getMemlockLimit0();
static long getOperatingSystemPageSize() {
try {
Field f = Unsafe.class.getDeclaredField("theUnsafe");
f.setAccessible(true);
Unsafe unsafe = (Unsafe)f.get((Object)null);
return (long)unsafe.pageSize();
} catch (Throwable var2) {
LOG.warn("Unable to get operating system page size. Guessing 4096.", var2);
return 4096L;
}
}
private static String stripDomain(String name) {
int i = name.indexOf(92);
if (i != -1) {
name = name.substring(i + 1);
}
return name;
}
public static String getOwner(FileDescriptor fd) throws IOException {
ensureInitialized();
if (Shell.WINDOWS) {
String owner = NativeIO.Windows.getOwner(fd);
owner = stripDomain(owner);
return owner;
} else {
long uid = NativeIO.POSIX.getUIDforFDOwnerforOwner(fd);
NativeIO.CachedUid cUid = (NativeIO.CachedUid)uidCache.get(uid);
long now = System.currentTimeMillis();
if (cUid != null && cUid.timestamp + cacheTimeout > now) {
return cUid.username;
} else {
String user = NativeIO.POSIX.getUserName(uid);
LOG.info("Got UserName " + user + " for UID " + uid + " from the native implementation");
cUid = new NativeIO.CachedUid(user, now);
uidCache.put(uid, cUid);
return user;
}
}
}
public static FileInputStream getShareDeleteFileInputStream(File f) throws IOException {
if (!Shell.WINDOWS) {
return new FileInputStream(f);
} else {
FileDescriptor fd = NativeIO.Windows.createFile(f.getAbsolutePath(), 2147483648L, 7L, 3L);
return new FileInputStream(fd);
}
}
public static FileInputStream getShareDeleteFileInputStream(File f, long seekOffset) throws IOException {
if (!Shell.WINDOWS) {
RandomAccessFile rf = new RandomAccessFile(f, "r");
if (seekOffset > 0L) {
rf.seek(seekOffset);
}
return new FileInputStream(rf.getFD());
} else {
FileDescriptor fd = NativeIO.Windows.createFile(f.getAbsolutePath(), 2147483648L, 7L, 3L);
if (seekOffset > 0L) {
NativeIO.Windows.setFilePointer(fd, seekOffset, 0L);
}
return new FileInputStream(fd);
}
}
public static FileOutputStream getCreateForWriteFileOutputStream(File f, int permissions) throws IOException {
FileDescriptor fd;
if (!Shell.WINDOWS) {
try {
fd = NativeIO.POSIX.open(f.getAbsolutePath(), 193, permissions);
return new FileOutputStream(fd);
} catch (NativeIOException var4) {
if (var4.getErrno() == Errno.EEXIST) {
throw new AlreadyExistsException(var4);
} else {
throw var4;
}
}
} else {
try {
fd = NativeIO.Windows.createFile(f.getCanonicalPath(), 1073741824L, 7L, 1L);
NativeIO.POSIX.chmod(f.getCanonicalPath(), permissions);
return new FileOutputStream(fd);
} catch (NativeIOException var3) {
if (var3.getErrorCode() == 80L) {
throw new AlreadyExistsException(var3);
} else {
throw var3;
}
}
}
}
private static synchronized void ensureInitialized() {
if (!initialized) {
cacheTimeout = (new Configuration()).getLong("hadoop.security.uid.cache.secs", 14400L) * 1000L;
LOG.info("Initialized cache for UID to User mapping with a cache timeout of " + cacheTimeout / 1000L + " seconds.");
initialized = true;
}
}
public static void renameTo(File src, File dst) throws IOException {
if (!nativeLoaded) {
if (!src.renameTo(dst)) {
throw new IOException("renameTo(src=" + src + ", dst=" + dst + ") failed.");
}
} else {
renameTo0(src.getAbsolutePath(), dst.getAbsolutePath());
}
}
public static void link(File src, File dst) throws IOException {
if (!nativeLoaded) {
HardLink.createHardLink(src, dst);
} else {
link0(src.getAbsolutePath(), dst.getAbsolutePath());
}
}
private static native void renameTo0(String var0, String var1) throws NativeIOException;
private static native void link0(String var0, String var1) throws NativeIOException;
public static void copyFileUnbuffered(File src, File dst) throws IOException {
if (nativeLoaded && Shell.WINDOWS) {
copyFileUnbuffered0(src.getAbsolutePath(), dst.getAbsolutePath());
} else {
FileInputStream fis = null;
FileOutputStream fos = null;
FileChannel input = null;
FileChannel output = null;
try {
fis = new FileInputStream(src);
fos = new FileOutputStream(dst);
input = fis.getChannel();
output = fos.getChannel();
long remaining = input.size();
long position = 0L;
for(long transferred = 0L; remaining > 0L; position += transferred) {
transferred = input.transferTo(position, remaining, output);
remaining -= transferred;
}
} finally {
IOUtils.cleanup(LOG, new Closeable[]{output});
IOUtils.cleanup(LOG, new Closeable[]{fos});
IOUtils.cleanup(LOG, new Closeable[]{input});
IOUtils.cleanup(LOG, new Closeable[]{fis});
}
}
}
private static native void copyFileUnbuffered0(String var0, String var1) throws NativeIOException;
static {
if (NativeCodeLoader.isNativeCodeLoaded()) {
try {
initNative();
nativeLoaded = true;
} catch (Throwable var1) {
PerformanceAdvisory.LOG.debug("Unable to initialize NativeIO libraries", var1);
}
}
uidCache = new ConcurrentHashMap();
initialized = false;
}
private static class CachedUid {
final long timestamp;
final String username;
public CachedUid(String username, long timestamp) {
this.timestamp = timestamp;
this.username = username;
}
}
public static class Windows {
public static final long GENERIC_READ = 2147483648L;
public static final long GENERIC_WRITE = 1073741824L;
public static final long FILE_SHARE_READ = 1L;
public static final long FILE_SHARE_WRITE = 2L;
public static final long FILE_SHARE_DELETE = 4L;
public static final long CREATE_NEW = 1L;
public static final long CREATE_ALWAYS = 2L;
public static final long OPEN_EXISTING = 3L;
public static final long OPEN_ALWAYS = 4L;
public static final long TRUNCATE_EXISTING = 5L;
public static final long FILE_BEGIN = 0L;
public static final long FILE_CURRENT = 1L;
public static final long FILE_END = 2L;
public static final long FILE_ATTRIBUTE_NORMAL = 128L;
public Windows() {
}
public static void createDirectoryWithMode(File path, int mode) throws IOException {
createDirectoryWithMode0(path.getAbsolutePath(), mode);
}
private static native void createDirectoryWithMode0(String var0, int var1) throws NativeIOException;
public static native FileDescriptor createFile(String var0, long var1, long var3, long var5) throws IOException;
public static FileOutputStream createFileOutputStreamWithMode(File path, boolean append, int mode) throws IOException {
long desiredAccess = 1073741824L;
long shareMode = 3L;
long creationDisposition = append ? 4L : 2L;
return new FileOutputStream(createFileWithMode0(path.getAbsolutePath(), desiredAccess, shareMode, creationDisposition, mode));
}
private static native FileDescriptor createFileWithMode0(String var0, long var1, long var3, long var5, int var7) throws NativeIOException;
public static native long setFilePointer(FileDescriptor var0, long var1, long var3) throws IOException;
private static native String getOwner(FileDescriptor var0) throws IOException;
private static native boolean access0(String var0, int var1);
public static boolean access(String path, NativeIO.Windows.AccessRight desiredAccess) throws IOException {
//return access0(path, desiredAccess.accessRight());
return true;
}
public static native void extendWorkingSetSize(long var0) throws IOException;
static {
if (NativeCodeLoader.isNativeCodeLoaded()) {
try {
NativeIO.initNative();
NativeIO.nativeLoaded = true;
} catch (Throwable var1) {
PerformanceAdvisory.LOG.debug("Unable to initialize NativeIO libraries", var1);
}
}
}
public static enum AccessRight {
ACCESS_READ(1),
ACCESS_WRITE(2),
ACCESS_EXECUTE(32);
private final int accessRight;
private AccessRight(int access) {
this.accessRight = access;
}
public int accessRight() {
return this.accessRight;
}
}
}
public static class POSIX {
public static final int O_RDONLY = 0;
public static final int O_WRONLY = 1;
public static final int O_RDWR = 2;
public static final int O_CREAT = 64;
public static final int O_EXCL = 128;
public static final int O_NOCTTY = 256;
public static final int O_TRUNC = 512;
public static final int O_APPEND = 1024;
public static final int O_NONBLOCK = 2048;
public static final int O_SYNC = 4096;
public static final int O_ASYNC = 8192;
public static final int O_FSYNC = 4096;
public static final int O_NDELAY = 2048;
public static final int POSIX_FADV_NORMAL = 0;
public static final int POSIX_FADV_RANDOM = 1;
public static final int POSIX_FADV_SEQUENTIAL = 2;
public static final int POSIX_FADV_WILLNEED = 3;
public static final int POSIX_FADV_DONTNEED = 4;
public static final int POSIX_FADV_NOREUSE = 5;
public static final int SYNC_FILE_RANGE_WAIT_BEFORE = 1;
public static final int SYNC_FILE_RANGE_WRITE = 2;
public static final int SYNC_FILE_RANGE_WAIT_AFTER = 4;
private static final Log LOG = LogFactory.getLog(NativeIO.class);
private static boolean nativeLoaded = false;
private static boolean fadvisePossible = true;
private static boolean syncFileRangePossible = true;
static final String WORKAROUND_NON_THREADSAFE_CALLS_KEY = "hadoop.workaround.non.threadsafe.getpwuid";
static final boolean WORKAROUND_NON_THREADSAFE_CALLS_DEFAULT = true;
private static long cacheTimeout = -1L;
private static NativeIO.POSIX.CacheManipulator cacheManipulator = new NativeIO.POSIX.CacheManipulator();
private static final Map<Integer, NativeIO.POSIX.CachedName> USER_ID_NAME_CACHE;
private static final Map<Integer, NativeIO.POSIX.CachedName> GROUP_ID_NAME_CACHE;
public static final int MMAP_PROT_READ = 1;
public static final int MMAP_PROT_WRITE = 2;
public static final int MMAP_PROT_EXEC = 4;
public POSIX() {
}
public static NativeIO.POSIX.CacheManipulator getCacheManipulator() {
return cacheManipulator;
}
public static void setCacheManipulator(NativeIO.POSIX.CacheManipulator cacheManipulator) {
cacheManipulator = cacheManipulator;
}
public static boolean isAvailable() {
return NativeCodeLoader.isNativeCodeLoaded() && nativeLoaded;
}
private static void assertCodeLoaded() throws IOException {
if (!isAvailable()) {
throw new IOException("NativeIO was not loaded");
}
}
public static native FileDescriptor open(String var0, int var1, int var2) throws IOException;
private static native NativeIO.POSIX.Stat fstat(FileDescriptor var0) throws IOException;
private static native void chmodImpl(String var0, int var1) throws IOException;
public static void chmod(String path, int mode) throws IOException {
if (!Shell.WINDOWS) {
chmodImpl(path, mode);
} else {
try {
chmodImpl(path, mode);
} catch (NativeIOException var3) {
if (var3.getErrorCode() == 3L) {
throw new NativeIOException("No such file or directory", Errno.ENOENT);
}
LOG.warn(String.format("NativeIO.chmod error (%d): %s", var3.getErrorCode(), var3.getMessage()));
throw new NativeIOException("Unknown error", Errno.UNKNOWN);
}
}
}
static native void posix_fadvise(FileDescriptor var0, long var1, long var3, int var5) throws NativeIOException;
static native void sync_file_range(FileDescriptor var0, long var1, long var3, int var5) throws NativeIOException;
static void posixFadviseIfPossible(String identifier, FileDescriptor fd, long offset, long len, int flags) throws NativeIOException {
if (nativeLoaded && fadvisePossible) {
try {
posix_fadvise(fd, offset, len, flags);
} catch (UnsupportedOperationException var8) {
fadvisePossible = false;
} catch (UnsatisfiedLinkError var9) {
fadvisePossible = false;
}
}
}
public static void syncFileRangeIfPossible(FileDescriptor fd, long offset, long nbytes, int flags) throws NativeIOException {
if (nativeLoaded && syncFileRangePossible) {
try {
sync_file_range(fd, offset, nbytes, flags);
} catch (UnsupportedOperationException var7) {
syncFileRangePossible = false;
} catch (UnsatisfiedLinkError var8) {
syncFileRangePossible = false;
}
}
}
static native void mlock_native(ByteBuffer var0, long var1) throws NativeIOException;
static void mlock(ByteBuffer buffer, long len) throws IOException {
assertCodeLoaded();
if (!buffer.isDirect()) {
throw new IOException("Cannot mlock a non-direct ByteBuffer");
} else {
mlock_native(buffer, len);
}
}
public static void munmap(MappedByteBuffer buffer) {
if (buffer instanceof DirectBuffer) {
Cleaner cleaner = ((DirectBuffer)buffer).cleaner();
cleaner.clean();
}
}
private static native long getUIDforFDOwnerforOwner(FileDescriptor var0) throws IOException;
private static native String getUserName(long var0) throws IOException;
public static NativeIO.POSIX.Stat getFstat(FileDescriptor fd) throws IOException {
NativeIO.POSIX.Stat stat = null;
if (!Shell.WINDOWS) {
stat = fstat(fd);
stat.owner = getName(NativeIO.POSIX.IdCache.USER, stat.ownerId);
stat.group = getName(NativeIO.POSIX.IdCache.GROUP, stat.groupId);
} else {
try {
stat = fstat(fd);
} catch (NativeIOException var3) {
if (var3.getErrorCode() == 6L) {
throw new NativeIOException("The handle is invalid.", Errno.EBADF);
}
LOG.warn(String.format("NativeIO.getFstat error (%d): %s", var3.getErrorCode(), var3.getMessage()));
throw new NativeIOException("Unknown error", Errno.UNKNOWN);
}
}
return stat;
}
private static String getName(NativeIO.POSIX.IdCache domain, int id) throws IOException {
Map<Integer, NativeIO.POSIX.CachedName> idNameCache = domain == NativeIO.POSIX.IdCache.USER ? USER_ID_NAME_CACHE : GROUP_ID_NAME_CACHE;
NativeIO.POSIX.CachedName cachedName = (NativeIO.POSIX.CachedName)idNameCache.get(id);
long now = System.currentTimeMillis();
String name;
if (cachedName != null && cachedName.timestamp + cacheTimeout > now) {
name = cachedName.name;
} else {
name = domain == NativeIO.POSIX.IdCache.USER ? getUserName(id) : getGroupName(id);
if (LOG.isDebugEnabled()) {
String type = domain == NativeIO.POSIX.IdCache.USER ? "UserName" : "GroupName";
LOG.debug("Got " + type + " " + name + " for ID " + id + " from the native implementation");
}
cachedName = new NativeIO.POSIX.CachedName(name, now);
idNameCache.put(id, cachedName);
}
return name;
}
static native String getUserName(int var0) throws IOException;
static native String getGroupName(int var0) throws IOException;
public static native long mmap(FileDescriptor var0, int var1, boolean var2, long var3) throws IOException;
public static native void munmap(long var0, long var2) throws IOException;
static {
if (NativeCodeLoader.isNativeCodeLoaded()) {
try {
Configuration conf = new Configuration();
NativeIO.workaroundNonThreadSafePasswdCalls = conf.getBoolean("hadoop.workaround.non.threadsafe.getpwuid", true);
NativeIO.initNative();
nativeLoaded = true;
cacheTimeout = conf.getLong("hadoop.security.uid.cache.secs", 14400L) * 1000L;
LOG.debug("Initialized cache for IDs to User/Group mapping with a cache timeout of " + cacheTimeout / 1000L + " seconds.");
} catch (Throwable var1) {
PerformanceAdvisory.LOG.debug("Unable to initialize NativeIO libraries", var1);
}
}
USER_ID_NAME_CACHE = new ConcurrentHashMap();
GROUP_ID_NAME_CACHE = new ConcurrentHashMap();
}
private static enum IdCache {
USER,
GROUP;
private IdCache() {
}
}
private static class CachedName {
final long timestamp;
final String name;
public CachedName(String name, long timestamp) {
this.name = name;
this.timestamp = timestamp;
}
}
public static class Stat {
private int ownerId;
private int groupId;
private String owner;
private String group;
private int mode;
public static final int S_IFMT = 61440;
public static final int S_IFIFO = 4096;
public static final int S_IFCHR = 8192;
public static final int S_IFDIR = 16384;
public static final int S_IFBLK = 24576;
public static final int S_IFREG = 32768;
public static final int S_IFLNK = 40960;
public static final int S_IFSOCK = 49152;
public static final int S_IFWHT = 57344;
public static final int S_ISUID = 2048;
public static final int S_ISGID = 1024;
public static final int S_ISVTX = 512;
public static final int S_IRUSR = 256;
public static final int S_IWUSR = 128;
public static final int S_IXUSR = 64;
Stat(int ownerId, int groupId, int mode) {
this.ownerId = ownerId;
this.groupId = groupId;
this.mode = mode;
}
Stat(String owner, String group, int mode) {
if (!Shell.WINDOWS) {
this.owner = owner;
} else {
this.owner = NativeIO.stripDomain(owner);
}
if (!Shell.WINDOWS) {
this.group = group;
} else {
this.group = NativeIO.stripDomain(group);
}
this.mode = mode;
}
public String toString() {
return "Stat(owner='" + this.owner + "', group='" + this.group + "'" + ", mode=" + this.mode + ")";
}
public String getOwner() {
return this.owner;
}
public String getGroup() {
return this.group;
}
public int getMode() {
return this.mode;
}
}
@VisibleForTesting
public static class NoMlockCacheManipulator extends NativeIO.POSIX.CacheManipulator {
public NoMlockCacheManipulator() {
}
public void mlock(String identifier, ByteBuffer buffer, long len) throws IOException {
NativeIO.POSIX.LOG.info("mlocking " + identifier);
}
public long getMemlockLimit() {
return 1125899906842624L;
}
public long getOperatingSystemPageSize() {
return 4096L;
}
public boolean verifyCanMlock() {
return true;
}
}
@VisibleForTesting
public static class CacheManipulator {
public CacheManipulator() {
}
public void mlock(String identifier, ByteBuffer buffer, long len) throws IOException {
NativeIO.POSIX.mlock(buffer, len);
}
public long getMemlockLimit() {
return NativeIO.getMemlockLimit();
}
public long getOperatingSystemPageSize() {
return NativeIO.getOperatingSystemPageSize();
}
public void posixFadviseIfPossible(String identifier, FileDescriptor fd, long offset, long len, int flags) throws NativeIOException {
NativeIO.POSIX.posixFadviseIfPossible(identifier, fd, offset, len, flags);
}
public boolean verifyCanMlock() {
return NativeIO.isAvailable();
}
}
}
}