Merge lp:~bigdata-dev/charms/bundles/realtime-syslog-analytics/bundle into lp:~charmers/charms/bundles/realtime-syslog-analytics/bundle

Proposed by Cory Johns
Status: Merged
Merged at revision: 7
Proposed branch: lp:~bigdata-dev/charms/bundles/realtime-syslog-analytics/bundle
Merge into: lp:~charmers/charms/bundles/realtime-syslog-analytics/bundle
Diff against target: 185 lines (+163/-1)
3 files modified
bundle.yaml (+1/-1)
tests/00-setup (+8/-0)
tests/01-bundle.py (+154/-0)
To merge this branch: bzr merge lp:~bigdata-dev/charms/bundles/realtime-syslog-analytics/bundle
Reviewer Review Type Date Requested Status
Tim Van Steenburgh (community) Approve
Review via email: mp+273290@code.launchpad.net

Description of the change

Test fixes for the CWR (Cloud Weather Report).

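For reference, the added tests can be exercised outside of the CWR roughly as follows (a minimal sketch, assuming a bootstrapped Juju environment and that the commands are run from the bundle root; the deployment itself is driven by Amulet inside the test):

    bash tests/00-setup         # installs Amulet from ppa:juju/stable if it is missing
    python3 tests/01-bundle.py  # loads bundle.yaml, deploys it, and runs the checks
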
Revision history for this message
Tim Van Steenburgh (tvansteenburgh) :
review: Approve

Preview Diff

=== modified file 'bundle.yaml'
--- bundle.yaml 2015-09-22 03:52:32 +0000
+++ bundle.yaml 2015-10-02 19:59:25 +0000
@@ -31,7 +31,7 @@
       gui-x: "900"
       gui-y: "200"
   rsyslog-forwarder:
-    charm: cs:trusty/rsyslog-forwarder-ha-4
+    charm: cs:trusty/rsyslog-forwarder-ha-5
     annotations:
       gui-x: "900"
       gui-y: "600"
=== added directory 'tests'
=== added file 'tests/00-setup'
--- tests/00-setup 1970-01-01 00:00:00 +0000
+++ tests/00-setup 2015-10-02 19:59:25 +0000
@@ -0,0 +1,8 @@
+#!/bin/bash
+
+if ! python3 -c 'import amulet' &> /dev/null; then
+    echo Installing Amulet...
+    sudo add-apt-repository -y ppa:juju/stable
+    sudo apt-get update
+    sudo apt-get -y install amulet
+fi
=== added file 'tests/01-bundle.py'
--- tests/01-bundle.py 1970-01-01 00:00:00 +0000
+++ tests/01-bundle.py 2015-10-02 19:59:25 +0000
@@ -0,0 +1,154 @@
+#!/usr/bin/env python3
+
+import re
+import os
+import unittest
+import textwrap
+
+import yaml
+import amulet
+
+
+class TestBundle(unittest.TestCase):
+    bundle_file = os.path.join(os.path.dirname(__file__), '..', 'bundle.yaml')
+
+    @classmethod
+    def setUpClass(cls):
+        cls.d = amulet.Deployment(series='trusty')
+        with open(cls.bundle_file) as f:
+            bun = f.read()
+        bundle = yaml.safe_load(bun)
+        cls.d.load(bundle)
+        cls.d.setup(timeout=1800)
+        cls.d.sentry.wait_for_messages({
+            'compute-slave': 'Ready',
+            'plugin': 'Ready',
+            'zeppelin': 'Ready',
+            'flume-syslog': 'Ready',
+        }, timeout=1800)
+        cls.hdfs = cls.d.sentry['hdfs-master'][0]
+        cls.yarn = cls.d.sentry['yarn-master'][0]
+        cls.slave = cls.d.sentry['compute-slave'][0]
+        cls.secondary = cls.d.sentry['secondary-namenode'][0]
+        cls.spark = cls.d.sentry['spark'][0]
+        cls.zeppelin = cls.d.sentry['zeppelin'][0]
+
+    def test_components(self):
+        """
+        Confirm that all of the required components are up and running.
+        """
+        hdfs, retcode = self.hdfs.run("pgrep -a java")
+        yarn, retcode = self.yarn.run("pgrep -a java")
+        slave, retcode = self.slave.run("pgrep -a java")
+        secondary, retcode = self.secondary.run("pgrep -a java")
+        spark, retcode = self.spark.run("pgrep -a java")
+
+        # .NameNode needs the . to differentiate it from SecondaryNameNode
+        assert '.NameNode' in hdfs, "NameNode not started"
+        assert '.NameNode' not in yarn, "NameNode should not be running on yarn-master"
+        assert '.NameNode' not in slave, "NameNode should not be running on compute-slave"
+        assert '.NameNode' not in secondary, "NameNode should not be running on secondary-namenode"
+        assert '.NameNode' not in spark, "NameNode should not be running on spark"
+
+        assert 'ResourceManager' in yarn, "ResourceManager not started"
+        assert 'ResourceManager' not in hdfs, "ResourceManager should not be running on hdfs-master"
+        assert 'ResourceManager' not in slave, "ResourceManager should not be running on compute-slave"
+        assert 'ResourceManager' not in secondary, "ResourceManager should not be running on secondary-namenode"
+        assert 'ResourceManager' not in spark, "ResourceManager should not be running on spark"
+
+        assert 'JobHistoryServer' in yarn, "JobHistoryServer not started"
+        assert 'JobHistoryServer' not in hdfs, "JobHistoryServer should not be running on hdfs-master"
+        assert 'JobHistoryServer' not in slave, "JobHistoryServer should not be running on compute-slave"
+        assert 'JobHistoryServer' not in secondary, "JobHistoryServer should not be running on secondary-namenode"
+        assert 'JobHistoryServer' not in spark, "JobHistoryServer should not be running on spark"
+
+        assert 'NodeManager' in slave, "NodeManager not started"
+        assert 'NodeManager' not in yarn, "NodeManager should not be running on yarn-master"
+        assert 'NodeManager' not in hdfs, "NodeManager should not be running on hdfs-master"
+        assert 'NodeManager' not in secondary, "NodeManager should not be running on secondary-namenode"
+        assert 'NodeManager' not in spark, "NodeManager should not be running on spark"
+
+        assert 'DataNode' in slave, "DataNode not started"
+        assert 'DataNode' not in yarn, "DataNode should not be running on yarn-master"
+        assert 'DataNode' not in hdfs, "DataNode should not be running on hdfs-master"
+        assert 'DataNode' not in secondary, "DataNode should not be running on secondary-namenode"
+        assert 'DataNode' not in spark, "DataNode should not be running on spark"
+
+        assert 'SecondaryNameNode' in secondary, "SecondaryNameNode not started"
+        assert 'SecondaryNameNode' not in yarn, "SecondaryNameNode should not be running on yarn-master"
+        assert 'SecondaryNameNode' not in hdfs, "SecondaryNameNode should not be running on hdfs-master"
+        assert 'SecondaryNameNode' not in slave, "SecondaryNameNode should not be running on compute-slave"
+        assert 'SecondaryNameNode' not in spark, "SecondaryNameNode should not be running on spark"
+
+        assert 'spark' in spark, 'Spark should be running on spark'
+        assert 'zeppelin' in spark, 'Zeppelin should be running on spark'
+
+    def test_hdfs_dir(self):
+        """
+        Validate a few administrative Hadoop operations on the HDFS cluster:
+        1) create a directory on the HDFS cluster (mkdir)
+        2) change the owner of an HDFS directory (chown)
+        3) set access permissions on an HDFS directory (chmod)
+
+        NB: These are order-dependent, so must be done as part of a single test case.
+        """
+        output, retcode = self.spark.run("su hdfs -c 'hdfs dfs -mkdir -p /user/ubuntu'")
+        assert retcode == 0, "Creating a user directory on HDFS FAILED:\n{}".format(output)
+        output, retcode = self.spark.run("su hdfs -c 'hdfs dfs -chown ubuntu:ubuntu /user/ubuntu'")
+        assert retcode == 0, "Assigning an owner to the HDFS directory FAILED:\n{}".format(output)
+        output, retcode = self.spark.run("su hdfs -c 'hdfs dfs -chmod -R 755 /user/ubuntu'")
+        assert retcode == 0, "Setting directory permissions on HDFS FAILED:\n{}".format(output)
+        output, retcode = self.spark.run("su hdfs -c 'hdfs dfs -rmdir /user/ubuntu'")
+
+    def test_yarn_mapreduce_exe(self):
+        """
+        Validate YARN MapReduce operations:
+        1) validate MapReduce execution - writing to HDFS
+        2) validate a successful MapReduce operation after the execution
+        3) validate MapReduce execution - reading and writing to HDFS
+        4) validate a successful MapReduce operation after the execution
+        5) validate successful deletion of the MapReduce results from HDFS
+
+        NB: These are order-dependent, so must be done as part of a single test case.
+        """
+        jar_file = '/usr/lib/hadoop/share/hadoop/mapreduce/hadoop-mapreduce-examples-*.jar'
+        test_steps = [
+            ('teragen', "su ubuntu -c 'hadoop jar {} teragen 10000 /user/ubuntu/teragenout'".format(jar_file)),
+            ('mapreduce #1', "su hdfs -c 'hdfs dfs -ls /user/ubuntu/teragenout/_SUCCESS'"),
+            ('terasort', "su ubuntu -c 'hadoop jar {} terasort /user/ubuntu/teragenout /user/ubuntu/terasortout'".
+             format(jar_file)),
+            ('mapreduce #2', "su hdfs -c 'hdfs dfs -ls /user/ubuntu/terasortout/_SUCCESS'"),
+            ('cleanup', "su hdfs -c 'hdfs dfs -rm -r /user/ubuntu/teragenout'"),
+        ]
+        for name, step in test_steps:
+            output, retcode = self.spark.run(step)
+            assert retcode == 0, "{} FAILED:\n{}".format(name, output)
+
+    def test_spark(self):
+        output, retcode = self.spark.run("su ubuntu -c 'bash -lc /home/ubuntu/sparkpi.sh 2>&1'")
+        assert 'Pi is roughly' in output, 'SparkPi test failed: %s' % output
+
+    def test_ingest(self):
+        self.spark.ssh('ls /home/ubuntu')  # ensure at least one pure ssh session for the logs
+        for i in amulet.helpers.timeout_gen(60 * 5):  # wait for the log messages to be ingested
+            output, retcode = self.spark.run("su hdfs -c 'hdfs dfs -ls /user/flume/flume-syslog/*/*'")
+            if retcode == 0 and 'FlumeData' in output:
+                break
+
+        ssh_count = textwrap.dedent("""
+            from pyspark import SparkContext
+            sc = SparkContext(appName="ssh-count")
+            count = sc.textFile("/user/flume/flume-syslog/*/*").filter(lambda line: "sshd" in line).count()
+            print "SSH Logins: %s" % count
+        """)
+        output, retcode = self.spark.run("cat << EOP > /home/ubuntu/ssh-count.py\n{}\nEOP".format(ssh_count))
+        assert retcode == 0
+        output, retcode = self.spark.run("su ubuntu -c 'spark-submit --master yarn-client /home/ubuntu/ssh-count.py'")
+        assert re.search(r'SSH Logins: [1-9][0-9]*', output), 'ssh-count.py failed: %s' % output
+
+    def test_zeppelin(self):
+        pass  # requires javascript; how to test?
+
+
+if __name__ == '__main__':
+    unittest.main()
