Skip to content

Commit 31fde6f

Browse files
authored
Merge pull request #133 from sarfata/bugfix/esp-crashes
Bugfix/esp crashes
2 parents c041cb3 + 48ee98b commit 31fde6f

File tree

9 files changed

+184
-90
lines changed

9 files changed

+184
-90
lines changed

README.md

+5
Original file line numberDiff line numberDiff line change
@@ -192,6 +192,11 @@ been possible!**
192192

193193
## Changelog
194194

195+
* 2018 04 25 - v1.2.4
196+
* Improved WiFi connection stability
197+
This required the latest version of ESP firmware.
198+
And also some changes to the TCP/NMEA server.
199+
* #96: make wifi led go green when we have a websocket client connected
195200
* 2018 04 23 - v1.2.3
196201
* Repeat all NMEA and NMEA2000 data to the computer when the serial port is
197202
opened at 38400 bauds.

esp-crash.py

+138
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,138 @@
1+
#!/usr/bin/env python
2+
3+
import argparse
4+
import re
5+
import os
6+
import subprocess
7+
import sys
8+
9+
10+
class ESPCrashParser(object):
11+
ESP_EXCEPTIONS = [
12+
"Illegal instruction",
13+
"SYSCALL instruction",
14+
"InstructionFetchError: Processor internal physical address or data error during instruction fetch",
15+
"LoadStoreError: Processor internal physical address or data error during load or store",
16+
"Level1Interrupt: Level-1 interrupt as indicated by set level-1 bits in the INTERRUPT register",
17+
"Alloca: MOVSP instruction, if caller's registers are not in the register file",
18+
"IntegerDivideByZero: QUOS, QUOU, REMS, or REMU divisor operand is zero",
19+
"reserved",
20+
"Privileged: Attempt to execute a privileged operation when CRING ? 0",
21+
"LoadStoreAlignmentCause: Load or store to an unaligned address",
22+
"reserved",
23+
"reserved",
24+
"InstrPIFDataError: PIF data error during instruction fetch",
25+
"LoadStorePIFDataError: Synchronous PIF data error during LoadStore access",
26+
"InstrPIFAddrError: PIF address error during instruction fetch",
27+
"LoadStorePIFAddrError: Synchronous PIF address error during LoadStore access",
28+
"InstTLBMiss: Error during Instruction TLB refill",
29+
"InstTLBMultiHit: Multiple instruction TLB entries matched",
30+
"InstFetchPrivilege: An instruction fetch referenced a virtual address at a ring level less than CRING",
31+
"reserved",
32+
"InstFetchProhibited: An instruction fetch referenced a page mapped with an attribute that does not permit instruction fetch",
33+
"reserved",
34+
"reserved",
35+
"reserved",
36+
"LoadStoreTLBMiss: Error during TLB refill for a load or store",
37+
"LoadStoreTLBMultiHit: Multiple TLB entries matched for a load or store",
38+
"LoadStorePrivilege: A load or store referenced a virtual address at a ring level less than CRING",
39+
"reserved",
40+
"LoadProhibited: A load referenced a page mapped with an attribute that does not permit loads",
41+
"StoreProhibited: A store referenced a page mapped with an attribute that does not permit stores"
42+
]
43+
44+
def __init__(self, toolchain_path, elf_path):
45+
self.toolchain_path = toolchain_path
46+
self.gdb_path = os.path.join(toolchain_path, "bin", "xtensa-lx106-elf-gdb")
47+
self.addr2line_path = os.path.join(toolchain_path, "bin", "xtensa-lx106-elf-addr2line")
48+
49+
if not os.path.exists(self.gdb_path):
50+
raise Exception("GDB for ESP not found in {} - {} does not exist.\nUse --toolchain to point to "
51+
"your toolchain folder.".format(self.toolchain_path, self.gdb_path))
52+
53+
if not os.path.exists(self.addr2line_path):
54+
raise Exception("addr2line for ESP not found in {} - {} does not exist.\nUse --toolchain to point to "
55+
"your toolchain folder.".format(self.toolchain_path, self.addr2line_path))
56+
57+
self.elf_path = elf_path
58+
if not os.path.exists(self.elf_path):
59+
raise Exception("ELF file not found: '{}'".format(self.elf_path))
60+
61+
def parse_text(self, text):
62+
print self.parse_exception(text)
63+
64+
m = re.search('stack(.*)stack', text, flags = re.MULTILINE | re.DOTALL)
65+
if m:
66+
print "Stack trace:"
67+
for l in self.parse_stack(m.group(1)):
68+
print " " + l
69+
else:
70+
print "No stack trace found."
71+
72+
def parse_exception(self, text):
73+
m = re.search('Exception \(([0-9]*)\):', text)
74+
if m:
75+
exception_id = int(m.group(1))
76+
if 0 <= exception_id <= 29:
77+
return "Exception {}: {}".format(exception_id, ESPCrashParser.ESP_EXCEPTIONS[exception_id])
78+
else:
79+
return "Unknown exception: {}".format(exception_id)
80+
81+
'''
82+
Decode one stack or backtrace.
83+
84+
See: https://github.com/me-no-dev/EspExceptionDecoder/blob/master/src/EspExceptionDecoder.java#L402
85+
'''
86+
def parse_stack(self, text):
87+
r = re.compile('40[0-2][0-9a-fA-F]{5}\s')
88+
m = r.findall(text)
89+
return self.decode_function_addresses(m)
90+
91+
def decode_function_address(self, address):
92+
args = [self.addr2line_path, "-e", self.elf_path, "-aipfC", address]
93+
return subprocess.check_output(args).strip()
94+
95+
def decode_function_addresses(self, addresses):
96+
out = []
97+
for a in addresses:
98+
out.append(self.decode_function_address(a))
99+
return out
100+
101+
'''
102+
GDB Should produce line number: https://github.com/me-no-dev/EspExceptionDecoder/commit/a78672da204151cc93979a96ed9f89139a73893f
103+
However it does not produce anything for me. So not using it for now.
104+
'''
105+
def decode_function_addresses_with_gdb(self, addresses):
106+
args = [self.gdb_path, "--batch"]
107+
108+
# Disable user config file which might interfere here
109+
args.extend(["-iex", "set auto-load local-gdbinit off"])
110+
111+
args.append(self.elf_path)
112+
113+
args.extend(["-ex", "set listsize 1"])
114+
for address in addresses:
115+
args.append("-ex")
116+
args.append("l *0x{}".format(address))
117+
args.extend(["-ex", "q"])
118+
119+
print "Running: {}".format(args)
120+
out = subprocess.check_output(args)
121+
print out
122+
123+
def main():
124+
parser = argparse.ArgumentParser()
125+
parser.add_argument("--toolchain", help="Path to the Xtensa toolchain",
126+
default=os.path.join(os.environ.get("HOME"), ".platformio/packages/toolchain-xtensa"))
127+
parser.add_argument("--elf", help="Path to the ELF file of the firmware",
128+
default=".pioenvs/esp/firmware.elf")
129+
parser.add_argument("input", type=argparse.FileType('r'), default=sys.stdin)
130+
131+
args = parser.parse_args()
132+
133+
crash_parser = ESPCrashParser(args.toolchain, args.elf)
134+
crash_parser.parse_text(args.input.read())
135+
136+
137+
if __name__ == '__main__':
138+
main()

platformio.ini

+2-1
Original file line numberDiff line numberDiff line change
@@ -60,9 +60,10 @@ lib_deps =
6060
[env:esp]
6161
src_filter = +<common/*>,+<esp/*>
6262
# no-strict-aliasing required here due to ESP+NMEA2000 incompatibilities
63-
build_flags = -Wall -Wno-strict-aliasing
63+
build_flags = -Wall -Werror -fno-strict-aliasing
6464
-Isrc/common -Isrc/esp
6565
-DHAVE_STRLCPY -DHAVE_STRLCAT
66+
#platform=espressif8266
6667
platform=https://github.com/platformio/platform-espressif8266.git#feature/stage
6768
framework = arduino
6869
board = esp_wroom_02

src/esp/NetServer.cpp

+15-43
Original file line numberDiff line numberDiff line change
@@ -34,29 +34,26 @@ NetServer::NetServer(int port) : server(port) {
3434
}
3535

3636
void NetServer::handleDisconnect(int clientIndex) {
37-
clients[clientIndex]->free();
38-
delete(clients[clientIndex]);
39-
clients[clientIndex] = 0;
40-
queues[clientIndex].clear();
37+
DEBUG("Disconnect for client %i", clientIndex);
38+
// AsyncPrinter will delete the client object in the client->onDisconnect handler.
4139
}
4240

4341
void NetServer::handleNewClient(AsyncClient *client) {
4442
DEBUG("New connection");
4543
int i;
4644
for (i = 0; i < maxClients; i++) {
47-
if (!clients[i] || !clients[i]->connected()) {
48-
clients[i] = client;
45+
if (!clients[i]) {
46+
clients[i] = AsyncPrinter(client, 2048);
4947

50-
client->onAck([this, i](void *s, AsyncClient *c, size_t len, uint32_t time) {
51-
//DEBUG("Got ack for client %i len=%u time=%u", i, len, time);
52-
}, 0);
53-
client->onData([this, i](void *s, AsyncClient *c, void *data, size_t len) {
48+
clients[i].onData([this, i](void *s, AsyncPrinter *c, uint8_t *data, size_t len) {
5449
DEBUG("Got data from client %i len=%i", i, len);
5550
}, 0);
56-
client->onDisconnect([this, i](void *s, AsyncClient *c) {
57-
DEBUG("Disconnect for client %i", i);
51+
clients[i].onClose([this, i](void *s, AsyncPrinter *c) {
5852
handleDisconnect(i);
5953
}, 0);
54+
55+
// Attach some debug messages directly to the client for information.
56+
// These handlers are not set by AsyncPrinter.
6057
client->onError([this, i](void *s, AsyncClient *c, int8_t error) {
6158
DEBUG("Error %s (%i) on client %i", c->errorToString(error), error, i);
6259
}, 0);
@@ -69,7 +66,8 @@ void NetServer::handleNewClient(AsyncClient *client) {
6966
}
7067
}
7168
DEBUG("Rejecting client - Too many connections already.");
72-
// We cannot accept this connection at the moment
69+
// We cannot accept this connection at the moment. Set a handler to free the object when disconnected
70+
// and start disconnection.
7371
client->onDisconnect([](void *s, AsyncClient *c) {
7472
delete(c);
7573
});
@@ -78,50 +76,24 @@ void NetServer::handleNewClient(AsyncClient *client) {
7876

7977
void NetServer::writeAll(const uint8_t *bytes, int len) {
8078
for (int i = 0; i < maxClients; i++) {
81-
if (clients[i] && clients[i]->connected()) {
82-
queues[i].add(NetMessage(bytes, len));
79+
if (clients[i]) {
80+
clients[i].write(bytes, len);
8381
}
8482
}
8583
}
8684

8785
int NetServer::clientsCount() {
8886
int count = 0;
8987
for (int i = 0; i < maxClients; i++) {
90-
//DEBUG("counting - i=%i count=%i clients[i]=%p clients[i]->connected()=%s",
91-
//i, count, clients[i], clients[i] ? (clients[i]->connected() ? "connected" : "not connected") : "n/a");
92-
if (clients[i] && clients[i]->connected()) {
88+
if (clients[i]) {
9389
count++;
9490
}
9591
}
9692
return count;
9793
}
9894

9995
void NetServer::loop() {
100-
for (int i = 0; i < maxClients; i++) {
101-
if (clients[i] && clients[i]->connected()) {
102-
if (clients[i]->canSend() && queues[i].size() > 0) {
103-
//DEBUG("Sending for clients[%i] queue len=%i", i, queues[i].size());
104-
105-
LinkedList<NetMessage>::iterator it = queues[i].begin();
106-
if (clients[i]->write((const char*)it->bytes(), it->len()) > 0) {
107-
queues[i].removeFirst();
108-
}
109-
}
110-
}
111-
else {
112-
queues[i].clear();
113-
}
114-
}
115-
/*
116-
if (!clients[i]->canSend()) {
117-
DEBUG("client[%i]: BUSY in state %s", i, clients[i]->stateToString());
118-
continue;
119-
}
120-
size_t sent = clients[i]->write((char*)bytes, len);
121-
if (sent != len) {
122-
DEBUG("client[%i]: sent %i of %i bytes", i, sent, len);
123-
}
124-
*/
96+
// Writes are performed asynchronously.
12597
}
12698

12799

src/esp/NetServer.h

+2-41
Original file line numberDiff line numberDiff line change
@@ -25,44 +25,7 @@
2525

2626
#include <ESP8266WiFi.h>
2727
#include <ESPAsyncTCP.h>
28-
#include "common/algo/List.h"
29-
30-
/*
31-
* Used to build a buffer (with a LinkedList<NetMessage>) of
32-
* messages that are waiting for each client.
33-
* Using a LinkedList here is pretty inefficient.
34-
* FIXME: Use a circular buffer or dynamic buffer (with a max size) instead of
35-
* this.
36-
*/
37-
class NetMessage {
38-
private:
39-
uint8_t* _bytes;
40-
int _len;
41-
42-
public:
43-
NetMessage(const uint8_t *bytes, int len) : _len(len) {
44-
_bytes = (uint8_t*)malloc(len);
45-
memcpy(_bytes, bytes, len);
46-
};
47-
48-
NetMessage(const NetMessage &m) {
49-
_bytes = (uint8_t*)malloc(m._len);
50-
memcpy(_bytes, m._bytes, m._len);
51-
_len = m._len;
52-
};
53-
54-
~NetMessage() {
55-
free(_bytes);
56-
};
57-
58-
int len() const {
59-
return _len;
60-
};
61-
62-
const uint8_t* bytes() const {
63-
return _bytes;
64-
};
65-
};
28+
#include <AsyncPrinter.h>
6629

6730
class NetServer {
6831
public:
@@ -74,11 +37,9 @@ class NetServer {
7437

7538
private:
7639
static const int maxClients = 8;
77-
AsyncClient *clients[maxClients];
40+
AsyncPrinter clients[maxClients];
7841
AsyncServer server;
7942

80-
LinkedList<NetMessage> queues[maxClients];
81-
8243
void handleNewClient(AsyncClient *client);
8344
void handleDisconnect(int clientIndex);
8445
};

src/esp/main.cpp

+1-1
Original file line numberDiff line numberDiff line change
@@ -153,7 +153,7 @@ void loop() {
153153
lastMessageTimer = 0;
154154
}
155155

156-
if (server.clientsCount() > 0) {
156+
if (server.clientsCount() + webServer.countClients() > 0) {
157157
rgb.setPixelColor(0, clientsConnectedColor);
158158
}
159159
else {

src/host/config/KBoxConfigParser.cpp

+2-2
Original file line numberDiff line numberDiff line change
@@ -38,8 +38,8 @@
3838
#define READ_INT_VALUE(name) READ_VALUE_WITH_TYPE(name, int)
3939

4040
#define READ_INT_VALUE_WRANGE(name, min, max) if (json[#name].is<int>() \
41-
&& json[#name] > min \
42-
&& json[#name] < max) { \
41+
&& json[#name] >= min \
42+
&& json[#name] <= max) { \
4343
config.name = \
4444
json[#name] .as<int>(); \
4545
}

src/host/services/WiFiService.cpp

+17-1
Original file line numberDiff line numberDiff line change
@@ -64,8 +64,24 @@ void WiFiService::loop() {
6464
else {
6565
KBoxMetrics.event(KBoxEventWiFiInvalidKommand);
6666
ERROR("Invalid command received from WiFi module (id=%i size=%i)", kr.getKommandIdentifier(), kr.dataSize());
67+
68+
// This is most likely a boot or reboot message from the ESP module.
69+
// Print it line by line, otherwise the message will be truncated.
70+
71+
unsigned int index = 0;
72+
uint8_t *currentLine = frame;
73+
while (index < len) {
74+
if (frame[index] == '\n') {
75+
frame[index] = '\0';
76+
DEBUG("> %s", currentLine);
77+
78+
currentLine = frame + index + 1;
79+
}
80+
index++;
81+
}
82+
6783
frame[len-1] = 0;
68-
DEBUG("> %s", frame);
84+
DEBUG("> %s", currentLine);
6985
}
7086

7187
_slip.readFrame(0, 0);

tools/nmea-tester/nmea.py

+2-1
Original file line numberDiff line numberDiff line change
@@ -72,6 +72,7 @@ def send_sentence(output, nmea):
7272

7373
def replay(input, output):
7474
for nmea in nmea_read_with_delay(input):
75+
output.reset_input_buffer()
7576
send_sentence(output, nmea)
7677

7778
def nmea_checksum(data):
@@ -133,7 +134,7 @@ def main():
133134

134135
port = None
135136
if args.port:
136-
port = serial.Serial(port = args.port, baudrate = args.baud, timeout = 1)
137+
port = serial.Serial(port = args.port, baudrate = args.baud, timeout = 1, write_timeout = 1, xonxoff=False, rtscts=False, dsrdtr=False)
137138

138139
if args.command == 'replay':
139140
if port:

0 commit comments

Comments
 (0)